{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.999968595825129, "global_step": 79606, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 0.002999623143984122, "loss": 3.9921, "step": 10 }, { "epoch": 0.0, "learning_rate": 0.0029992462879682436, "loss": 1.5317, "step": 20 }, { "epoch": 0.0, "learning_rate": 0.0029988694319523653, "loss": 1.2121, "step": 30 }, { "epoch": 0.0, "learning_rate": 0.0029984925759364875, "loss": 1.0693, "step": 40 }, { "epoch": 0.0, "learning_rate": 0.0029981157199206092, "loss": 0.9832, "step": 50 }, { "epoch": 0.0, "learning_rate": 0.0029977388639047305, "loss": 0.925, "step": 60 }, { "epoch": 0.0, "learning_rate": 0.0029973620078888527, "loss": 0.8599, "step": 70 }, { "epoch": 0.0, "learning_rate": 0.0029969851518729745, "loss": 0.8426, "step": 80 }, { "epoch": 0.0, "learning_rate": 0.002996608295857096, "loss": 0.8016, "step": 90 }, { "epoch": 0.0, "learning_rate": 0.002996231439841218, "loss": 0.7594, "step": 100 }, { "epoch": 0.0, "learning_rate": 0.0029958545838253397, "loss": 0.7358, "step": 110 }, { "epoch": 0.0, "learning_rate": 0.002995477727809462, "loss": 0.7094, "step": 120 }, { "epoch": 0.0, "learning_rate": 0.0029951008717935836, "loss": 0.7043, "step": 130 }, { "epoch": 0.0, "learning_rate": 0.0029947240157777054, "loss": 0.6813, "step": 140 }, { "epoch": 0.0, "learning_rate": 0.002994347159761827, "loss": 0.671, "step": 150 }, { "epoch": 0.0, "learning_rate": 0.002993970303745949, "loss": 0.6486, "step": 160 }, { "epoch": 0.0, "learning_rate": 0.002993593447730071, "loss": 0.6395, "step": 170 }, { "epoch": 0.0, "learning_rate": 0.0029932165917141923, "loss": 0.6361, "step": 180 }, { "epoch": 0.0, "learning_rate": 0.002992839735698314, "loss": 0.6132, "step": 190 }, { "epoch": 0.01, "learning_rate": 0.0029924628796824363, "loss": 0.6038, "step": 200 }, { "epoch": 0.01, "learning_rate": 0.002992086023666558, "loss": 0.5928, "step": 210 }, { "epoch": 0.01, "learning_rate": 0.0029917091676506797, "loss": 0.5775, "step": 220 }, { "epoch": 0.01, "learning_rate": 0.0029913323116348015, "loss": 0.5844, "step": 230 }, { "epoch": 0.01, "learning_rate": 0.0029909554556189232, "loss": 0.561, "step": 240 }, { "epoch": 0.01, "learning_rate": 0.002990578599603045, "loss": 0.5629, "step": 250 }, { "epoch": 0.01, "learning_rate": 0.0029902017435871667, "loss": 0.5413, "step": 260 }, { "epoch": 0.01, "learning_rate": 0.0029898248875712885, "loss": 0.5516, "step": 270 }, { "epoch": 0.01, "learning_rate": 0.0029894480315554106, "loss": 0.5345, "step": 280 }, { "epoch": 0.01, "learning_rate": 0.002989071175539532, "loss": 0.5332, "step": 290 }, { "epoch": 0.01, "learning_rate": 0.002988694319523654, "loss": 0.5317, "step": 300 }, { "epoch": 0.01, "learning_rate": 0.002988317463507776, "loss": 0.521, "step": 310 }, { "epoch": 0.01, "learning_rate": 0.0029879406074918976, "loss": 0.5091, "step": 320 }, { "epoch": 0.01, "learning_rate": 0.0029875637514760194, "loss": 0.5108, "step": 330 }, { "epoch": 0.01, "learning_rate": 0.002987186895460141, "loss": 0.4999, "step": 340 }, { "epoch": 0.01, "learning_rate": 0.0029868100394442633, "loss": 0.5046, "step": 350 }, { "epoch": 0.01, "learning_rate": 0.002986433183428385, "loss": 0.4958, "step": 360 }, { "epoch": 0.01, "learning_rate": 0.0029860563274125063, "loss": 0.4948, "step": 370 }, { "epoch": 0.01, "learning_rate": 0.0029856794713966285, "loss": 0.4778, "step": 380 }, { "epoch": 0.01, "learning_rate": 0.0029853026153807503, "loss": 0.4669, "step": 390 }, { "epoch": 0.01, "learning_rate": 0.002984925759364872, "loss": 0.4694, "step": 400 }, { "epoch": 0.01, "learning_rate": 0.0029845489033489938, "loss": 0.4669, "step": 410 }, { "epoch": 0.01, "learning_rate": 0.0029841720473331155, "loss": 0.4618, "step": 420 }, { "epoch": 0.01, "learning_rate": 0.0029837951913172377, "loss": 0.4561, "step": 430 }, { "epoch": 0.01, "learning_rate": 0.0029834183353013594, "loss": 0.4558, "step": 440 }, { "epoch": 0.01, "learning_rate": 0.002983041479285481, "loss": 0.4625, "step": 450 }, { "epoch": 0.01, "learning_rate": 0.002982664623269603, "loss": 0.4507, "step": 460 }, { "epoch": 0.01, "learning_rate": 0.0029822877672537247, "loss": 0.4496, "step": 470 }, { "epoch": 0.01, "learning_rate": 0.0029819109112378464, "loss": 0.4435, "step": 480 }, { "epoch": 0.01, "learning_rate": 0.002981534055221968, "loss": 0.4396, "step": 490 }, { "epoch": 0.01, "learning_rate": 0.00298115719920609, "loss": 0.444, "step": 500 }, { "epoch": 0.01, "eval_cer": 0.6732715529832191, "eval_loss": 0.33886468410491943, "eval_runtime": 90.4817, "eval_samples_per_second": 110.508, "eval_steps_per_second": 6.907, "step": 500 }, { "epoch": 0.01, "learning_rate": 0.002980780343190212, "loss": 0.4308, "step": 510 }, { "epoch": 0.01, "learning_rate": 0.0029804034871743334, "loss": 0.4287, "step": 520 }, { "epoch": 0.01, "learning_rate": 0.0029800266311584556, "loss": 0.4156, "step": 530 }, { "epoch": 0.01, "learning_rate": 0.0029796497751425773, "loss": 0.4347, "step": 540 }, { "epoch": 0.01, "learning_rate": 0.002979272919126699, "loss": 0.4347, "step": 550 }, { "epoch": 0.01, "learning_rate": 0.002978896063110821, "loss": 0.4227, "step": 560 }, { "epoch": 0.01, "learning_rate": 0.0029785192070949425, "loss": 0.4235, "step": 570 }, { "epoch": 0.01, "learning_rate": 0.0029781423510790647, "loss": 0.4185, "step": 580 }, { "epoch": 0.01, "learning_rate": 0.0029777654950631865, "loss": 0.419, "step": 590 }, { "epoch": 0.02, "learning_rate": 0.0029773886390473078, "loss": 0.4138, "step": 600 }, { "epoch": 0.02, "learning_rate": 0.00297701178303143, "loss": 0.4028, "step": 610 }, { "epoch": 0.02, "learning_rate": 0.0029766349270155517, "loss": 0.4085, "step": 620 }, { "epoch": 0.02, "learning_rate": 0.0029762580709996734, "loss": 0.4033, "step": 630 }, { "epoch": 0.02, "learning_rate": 0.002975881214983795, "loss": 0.3989, "step": 640 }, { "epoch": 0.02, "learning_rate": 0.002975504358967917, "loss": 0.3959, "step": 650 }, { "epoch": 0.02, "learning_rate": 0.002975127502952039, "loss": 0.3925, "step": 660 }, { "epoch": 0.02, "learning_rate": 0.0029747506469361604, "loss": 0.395, "step": 670 }, { "epoch": 0.02, "learning_rate": 0.002974373790920282, "loss": 0.3885, "step": 680 }, { "epoch": 0.02, "learning_rate": 0.0029739969349044043, "loss": 0.3886, "step": 690 }, { "epoch": 0.02, "learning_rate": 0.002973620078888526, "loss": 0.3905, "step": 700 }, { "epoch": 0.02, "learning_rate": 0.002973243222872648, "loss": 0.3884, "step": 710 }, { "epoch": 0.02, "learning_rate": 0.0029728663668567696, "loss": 0.3947, "step": 720 }, { "epoch": 0.02, "learning_rate": 0.0029724895108408913, "loss": 0.3868, "step": 730 }, { "epoch": 0.02, "learning_rate": 0.0029721126548250135, "loss": 0.3832, "step": 740 }, { "epoch": 0.02, "learning_rate": 0.002971735798809135, "loss": 0.3848, "step": 750 }, { "epoch": 0.02, "learning_rate": 0.002971358942793257, "loss": 0.3766, "step": 760 }, { "epoch": 0.02, "learning_rate": 0.0029709820867773787, "loss": 0.3797, "step": 770 }, { "epoch": 0.02, "learning_rate": 0.0029706052307615005, "loss": 0.3786, "step": 780 }, { "epoch": 0.02, "learning_rate": 0.0029702283747456222, "loss": 0.3694, "step": 790 }, { "epoch": 0.02, "learning_rate": 0.002969851518729744, "loss": 0.373, "step": 800 }, { "epoch": 0.02, "learning_rate": 0.0029694746627138657, "loss": 0.371, "step": 810 }, { "epoch": 0.02, "learning_rate": 0.002969097806697988, "loss": 0.3584, "step": 820 }, { "epoch": 0.02, "learning_rate": 0.002968720950682109, "loss": 0.3691, "step": 830 }, { "epoch": 0.02, "learning_rate": 0.0029683440946662314, "loss": 0.3656, "step": 840 }, { "epoch": 0.02, "learning_rate": 0.002967967238650353, "loss": 0.3662, "step": 850 }, { "epoch": 0.02, "learning_rate": 0.002967590382634475, "loss": 0.3619, "step": 860 }, { "epoch": 0.02, "learning_rate": 0.0029672135266185966, "loss": 0.3613, "step": 870 }, { "epoch": 0.02, "learning_rate": 0.0029668366706027184, "loss": 0.3551, "step": 880 }, { "epoch": 0.02, "learning_rate": 0.0029664598145868405, "loss": 0.371, "step": 890 }, { "epoch": 0.02, "learning_rate": 0.002966082958570962, "loss": 0.35, "step": 900 }, { "epoch": 0.02, "learning_rate": 0.0029657061025550836, "loss": 0.3464, "step": 910 }, { "epoch": 0.02, "learning_rate": 0.0029653292465392058, "loss": 0.3441, "step": 920 }, { "epoch": 0.02, "learning_rate": 0.0029649523905233275, "loss": 0.3513, "step": 930 }, { "epoch": 0.02, "learning_rate": 0.0029645755345074493, "loss": 0.3452, "step": 940 }, { "epoch": 0.02, "learning_rate": 0.002964198678491571, "loss": 0.3483, "step": 950 }, { "epoch": 0.02, "learning_rate": 0.0029638218224756928, "loss": 0.3463, "step": 960 }, { "epoch": 0.02, "learning_rate": 0.002963444966459815, "loss": 0.3423, "step": 970 }, { "epoch": 0.02, "learning_rate": 0.0029630681104439362, "loss": 0.3441, "step": 980 }, { "epoch": 0.02, "learning_rate": 0.0029626912544280584, "loss": 0.3489, "step": 990 }, { "epoch": 0.03, "learning_rate": 0.00296231439841218, "loss": 0.3429, "step": 1000 }, { "epoch": 0.03, "eval_cer": 0.6705959123333078, "eval_loss": 0.26553666591644287, "eval_runtime": 90.2108, "eval_samples_per_second": 110.84, "eval_steps_per_second": 6.928, "step": 1000 }, { "epoch": 0.03, "learning_rate": 0.002961937542396302, "loss": 0.3388, "step": 1010 }, { "epoch": 0.03, "learning_rate": 0.0029615606863804237, "loss": 0.3408, "step": 1020 }, { "epoch": 0.03, "learning_rate": 0.0029611838303645454, "loss": 0.3431, "step": 1030 }, { "epoch": 0.03, "learning_rate": 0.002960806974348667, "loss": 0.3392, "step": 1040 }, { "epoch": 0.03, "learning_rate": 0.0029604301183327893, "loss": 0.3382, "step": 1050 }, { "epoch": 0.03, "learning_rate": 0.0029600532623169106, "loss": 0.3425, "step": 1060 }, { "epoch": 0.03, "learning_rate": 0.002959676406301033, "loss": 0.3345, "step": 1070 }, { "epoch": 0.03, "learning_rate": 0.0029592995502851546, "loss": 0.3368, "step": 1080 }, { "epoch": 0.03, "learning_rate": 0.0029589226942692763, "loss": 0.3377, "step": 1090 }, { "epoch": 0.03, "learning_rate": 0.002958545838253398, "loss": 0.3267, "step": 1100 }, { "epoch": 0.03, "learning_rate": 0.00295816898223752, "loss": 0.332, "step": 1110 }, { "epoch": 0.03, "learning_rate": 0.0029577921262216415, "loss": 0.3262, "step": 1120 }, { "epoch": 0.03, "learning_rate": 0.0029574152702057633, "loss": 0.3305, "step": 1130 }, { "epoch": 0.03, "learning_rate": 0.002957038414189885, "loss": 0.3259, "step": 1140 }, { "epoch": 0.03, "learning_rate": 0.002956661558174007, "loss": 0.3221, "step": 1150 }, { "epoch": 0.03, "learning_rate": 0.002956284702158129, "loss": 0.3286, "step": 1160 }, { "epoch": 0.03, "learning_rate": 0.0029559078461422507, "loss": 0.3246, "step": 1170 }, { "epoch": 0.03, "learning_rate": 0.0029555309901263724, "loss": 0.3159, "step": 1180 }, { "epoch": 0.03, "learning_rate": 0.002955154134110494, "loss": 0.3159, "step": 1190 }, { "epoch": 0.03, "learning_rate": 0.0029547772780946164, "loss": 0.3244, "step": 1200 }, { "epoch": 0.03, "learning_rate": 0.0029544004220787377, "loss": 0.3265, "step": 1210 }, { "epoch": 0.03, "learning_rate": 0.0029540235660628594, "loss": 0.317, "step": 1220 }, { "epoch": 0.03, "learning_rate": 0.0029536467100469816, "loss": 0.3051, "step": 1230 }, { "epoch": 0.03, "learning_rate": 0.0029532698540311033, "loss": 0.3192, "step": 1240 }, { "epoch": 0.03, "learning_rate": 0.002952892998015225, "loss": 0.3194, "step": 1250 }, { "epoch": 0.03, "learning_rate": 0.002952516141999347, "loss": 0.3129, "step": 1260 }, { "epoch": 0.03, "learning_rate": 0.0029521392859834686, "loss": 0.3141, "step": 1270 }, { "epoch": 0.03, "learning_rate": 0.0029517624299675907, "loss": 0.3176, "step": 1280 }, { "epoch": 0.03, "learning_rate": 0.002951385573951712, "loss": 0.3152, "step": 1290 }, { "epoch": 0.03, "learning_rate": 0.0029510087179358342, "loss": 0.311, "step": 1300 }, { "epoch": 0.03, "learning_rate": 0.002950631861919956, "loss": 0.3164, "step": 1310 }, { "epoch": 0.03, "learning_rate": 0.0029502550059040777, "loss": 0.3056, "step": 1320 }, { "epoch": 0.03, "learning_rate": 0.0029498781498881995, "loss": 0.3124, "step": 1330 }, { "epoch": 0.03, "learning_rate": 0.002949501293872321, "loss": 0.3016, "step": 1340 }, { "epoch": 0.03, "learning_rate": 0.002949124437856443, "loss": 0.2999, "step": 1350 }, { "epoch": 0.03, "learning_rate": 0.0029487475818405647, "loss": 0.3043, "step": 1360 }, { "epoch": 0.03, "learning_rate": 0.0029483707258246864, "loss": 0.3036, "step": 1370 }, { "epoch": 0.03, "learning_rate": 0.0029479938698088086, "loss": 0.305, "step": 1380 }, { "epoch": 0.03, "learning_rate": 0.0029476170137929304, "loss": 0.3019, "step": 1390 }, { "epoch": 0.04, "learning_rate": 0.002947240157777052, "loss": 0.3098, "step": 1400 }, { "epoch": 0.04, "learning_rate": 0.002946863301761174, "loss": 0.2971, "step": 1410 }, { "epoch": 0.04, "learning_rate": 0.0029464864457452956, "loss": 0.3018, "step": 1420 }, { "epoch": 0.04, "learning_rate": 0.0029461095897294174, "loss": 0.3037, "step": 1430 }, { "epoch": 0.04, "learning_rate": 0.002945732733713539, "loss": 0.3026, "step": 1440 }, { "epoch": 0.04, "learning_rate": 0.002945355877697661, "loss": 0.2994, "step": 1450 }, { "epoch": 0.04, "learning_rate": 0.002944979021681783, "loss": 0.3042, "step": 1460 }, { "epoch": 0.04, "learning_rate": 0.0029446021656659048, "loss": 0.3, "step": 1470 }, { "epoch": 0.04, "learning_rate": 0.0029442253096500265, "loss": 0.2954, "step": 1480 }, { "epoch": 0.04, "learning_rate": 0.0029438484536341483, "loss": 0.2995, "step": 1490 }, { "epoch": 0.04, "learning_rate": 0.00294347159761827, "loss": 0.2914, "step": 1500 }, { "epoch": 0.04, "eval_cer": 0.6704616490704796, "eval_loss": 0.22774317860603333, "eval_runtime": 90.4054, "eval_samples_per_second": 110.602, "eval_steps_per_second": 6.913, "step": 1500 }, { "epoch": 0.04, "learning_rate": 0.002943094741602392, "loss": 0.2932, "step": 1510 }, { "epoch": 0.04, "learning_rate": 0.0029427178855865135, "loss": 0.2942, "step": 1520 }, { "epoch": 0.04, "learning_rate": 0.0029423410295706352, "loss": 0.2952, "step": 1530 }, { "epoch": 0.04, "learning_rate": 0.0029419641735547574, "loss": 0.2902, "step": 1540 }, { "epoch": 0.04, "learning_rate": 0.002941587317538879, "loss": 0.2969, "step": 1550 }, { "epoch": 0.04, "learning_rate": 0.002941210461523001, "loss": 0.2905, "step": 1560 }, { "epoch": 0.04, "learning_rate": 0.0029408336055071226, "loss": 0.2959, "step": 1570 }, { "epoch": 0.04, "learning_rate": 0.0029404567494912444, "loss": 0.2942, "step": 1580 }, { "epoch": 0.04, "learning_rate": 0.002940079893475366, "loss": 0.2969, "step": 1590 }, { "epoch": 0.04, "learning_rate": 0.002939703037459488, "loss": 0.2973, "step": 1600 }, { "epoch": 0.04, "learning_rate": 0.00293932618144361, "loss": 0.2976, "step": 1610 }, { "epoch": 0.04, "learning_rate": 0.002938949325427732, "loss": 0.2824, "step": 1620 }, { "epoch": 0.04, "learning_rate": 0.002938572469411853, "loss": 0.2918, "step": 1630 }, { "epoch": 0.04, "learning_rate": 0.0029381956133959753, "loss": 0.2897, "step": 1640 }, { "epoch": 0.04, "learning_rate": 0.002937818757380097, "loss": 0.2859, "step": 1650 }, { "epoch": 0.04, "learning_rate": 0.0029374419013642188, "loss": 0.279, "step": 1660 }, { "epoch": 0.04, "learning_rate": 0.0029370650453483405, "loss": 0.2871, "step": 1670 }, { "epoch": 0.04, "learning_rate": 0.0029366881893324623, "loss": 0.2826, "step": 1680 }, { "epoch": 0.04, "learning_rate": 0.0029363113333165844, "loss": 0.2859, "step": 1690 }, { "epoch": 0.04, "learning_rate": 0.002935934477300706, "loss": 0.2864, "step": 1700 }, { "epoch": 0.04, "learning_rate": 0.002935557621284828, "loss": 0.2808, "step": 1710 }, { "epoch": 0.04, "learning_rate": 0.0029351807652689497, "loss": 0.2775, "step": 1720 }, { "epoch": 0.04, "learning_rate": 0.0029348039092530714, "loss": 0.2812, "step": 1730 }, { "epoch": 0.04, "learning_rate": 0.0029344270532371936, "loss": 0.2762, "step": 1740 }, { "epoch": 0.04, "learning_rate": 0.002934050197221315, "loss": 0.281, "step": 1750 }, { "epoch": 0.04, "learning_rate": 0.0029336733412054367, "loss": 0.2811, "step": 1760 }, { "epoch": 0.04, "learning_rate": 0.002933296485189559, "loss": 0.2765, "step": 1770 }, { "epoch": 0.04, "learning_rate": 0.00293291962917368, "loss": 0.2847, "step": 1780 }, { "epoch": 0.04, "learning_rate": 0.0029325427731578023, "loss": 0.2843, "step": 1790 }, { "epoch": 0.05, "learning_rate": 0.002932165917141924, "loss": 0.2789, "step": 1800 }, { "epoch": 0.05, "learning_rate": 0.002931789061126046, "loss": 0.2844, "step": 1810 }, { "epoch": 0.05, "learning_rate": 0.0029314122051101676, "loss": 0.2748, "step": 1820 }, { "epoch": 0.05, "learning_rate": 0.0029310353490942893, "loss": 0.2743, "step": 1830 }, { "epoch": 0.05, "learning_rate": 0.002930658493078411, "loss": 0.2745, "step": 1840 }, { "epoch": 0.05, "learning_rate": 0.0029302816370625332, "loss": 0.2697, "step": 1850 }, { "epoch": 0.05, "learning_rate": 0.0029299047810466545, "loss": 0.273, "step": 1860 }, { "epoch": 0.05, "learning_rate": 0.0029295279250307767, "loss": 0.2713, "step": 1870 }, { "epoch": 0.05, "learning_rate": 0.0029291510690148985, "loss": 0.2791, "step": 1880 }, { "epoch": 0.05, "learning_rate": 0.00292877421299902, "loss": 0.2731, "step": 1890 }, { "epoch": 0.05, "learning_rate": 0.002928397356983142, "loss": 0.2713, "step": 1900 }, { "epoch": 0.05, "learning_rate": 0.0029280205009672637, "loss": 0.2793, "step": 1910 }, { "epoch": 0.05, "learning_rate": 0.002927643644951386, "loss": 0.2729, "step": 1920 }, { "epoch": 0.05, "learning_rate": 0.0029272667889355076, "loss": 0.2725, "step": 1930 }, { "epoch": 0.05, "learning_rate": 0.002926889932919629, "loss": 0.2697, "step": 1940 }, { "epoch": 0.05, "learning_rate": 0.002926513076903751, "loss": 0.2684, "step": 1950 }, { "epoch": 0.05, "learning_rate": 0.002926136220887873, "loss": 0.276, "step": 1960 }, { "epoch": 0.05, "learning_rate": 0.0029257593648719946, "loss": 0.2778, "step": 1970 }, { "epoch": 0.05, "learning_rate": 0.0029253825088561163, "loss": 0.2716, "step": 1980 }, { "epoch": 0.05, "learning_rate": 0.002925005652840238, "loss": 0.2677, "step": 1990 }, { "epoch": 0.05, "learning_rate": 0.0029246287968243603, "loss": 0.264, "step": 2000 }, { "epoch": 0.05, "eval_cer": 0.6698235376492957, "eval_loss": 0.20776917040348053, "eval_runtime": 90.9557, "eval_samples_per_second": 109.933, "eval_steps_per_second": 6.871, "step": 2000 }, { "epoch": 0.05, "learning_rate": 0.0029242519408084816, "loss": 0.2685, "step": 2010 }, { "epoch": 0.05, "learning_rate": 0.0029238750847926038, "loss": 0.2688, "step": 2020 }, { "epoch": 0.05, "learning_rate": 0.0029234982287767255, "loss": 0.2665, "step": 2030 }, { "epoch": 0.05, "learning_rate": 0.0029231213727608472, "loss": 0.2673, "step": 2040 }, { "epoch": 0.05, "learning_rate": 0.002922744516744969, "loss": 0.2602, "step": 2050 }, { "epoch": 0.05, "learning_rate": 0.0029223676607290907, "loss": 0.2632, "step": 2060 }, { "epoch": 0.05, "learning_rate": 0.0029219908047132125, "loss": 0.2626, "step": 2070 }, { "epoch": 0.05, "learning_rate": 0.0029216139486973347, "loss": 0.2667, "step": 2080 }, { "epoch": 0.05, "learning_rate": 0.002921237092681456, "loss": 0.2591, "step": 2090 }, { "epoch": 0.05, "learning_rate": 0.002920860236665578, "loss": 0.2577, "step": 2100 }, { "epoch": 0.05, "learning_rate": 0.0029204833806497, "loss": 0.2624, "step": 2110 }, { "epoch": 0.05, "learning_rate": 0.0029201065246338216, "loss": 0.257, "step": 2120 }, { "epoch": 0.05, "learning_rate": 0.0029197296686179434, "loss": 0.2583, "step": 2130 }, { "epoch": 0.05, "learning_rate": 0.002919352812602065, "loss": 0.2672, "step": 2140 }, { "epoch": 0.05, "learning_rate": 0.0029189759565861873, "loss": 0.2578, "step": 2150 }, { "epoch": 0.05, "learning_rate": 0.002918599100570309, "loss": 0.2549, "step": 2160 }, { "epoch": 0.05, "learning_rate": 0.0029182222445544304, "loss": 0.2643, "step": 2170 }, { "epoch": 0.05, "learning_rate": 0.0029178453885385525, "loss": 0.2617, "step": 2180 }, { "epoch": 0.06, "learning_rate": 0.0029174685325226743, "loss": 0.2536, "step": 2190 }, { "epoch": 0.06, "learning_rate": 0.002917091676506796, "loss": 0.2598, "step": 2200 }, { "epoch": 0.06, "learning_rate": 0.0029167148204909178, "loss": 0.2618, "step": 2210 }, { "epoch": 0.06, "learning_rate": 0.0029163379644750395, "loss": 0.2543, "step": 2220 }, { "epoch": 0.06, "learning_rate": 0.0029159611084591617, "loss": 0.2563, "step": 2230 }, { "epoch": 0.06, "learning_rate": 0.002915584252443283, "loss": 0.2618, "step": 2240 }, { "epoch": 0.06, "learning_rate": 0.0029152073964274047, "loss": 0.256, "step": 2250 }, { "epoch": 0.06, "learning_rate": 0.002914830540411527, "loss": 0.2554, "step": 2260 }, { "epoch": 0.06, "learning_rate": 0.0029144536843956487, "loss": 0.2555, "step": 2270 }, { "epoch": 0.06, "learning_rate": 0.0029140768283797704, "loss": 0.2533, "step": 2280 }, { "epoch": 0.06, "learning_rate": 0.002913699972363892, "loss": 0.2577, "step": 2290 }, { "epoch": 0.06, "learning_rate": 0.002913323116348014, "loss": 0.2526, "step": 2300 }, { "epoch": 0.06, "learning_rate": 0.002912946260332136, "loss": 0.2536, "step": 2310 }, { "epoch": 0.06, "learning_rate": 0.0029125694043162574, "loss": 0.2562, "step": 2320 }, { "epoch": 0.06, "learning_rate": 0.0029121925483003796, "loss": 0.2537, "step": 2330 }, { "epoch": 0.06, "learning_rate": 0.0029118156922845013, "loss": 0.2543, "step": 2340 }, { "epoch": 0.06, "learning_rate": 0.002911438836268623, "loss": 0.2562, "step": 2350 }, { "epoch": 0.06, "learning_rate": 0.002911061980252745, "loss": 0.2556, "step": 2360 }, { "epoch": 0.06, "learning_rate": 0.0029106851242368665, "loss": 0.2523, "step": 2370 }, { "epoch": 0.06, "learning_rate": 0.0029103082682209883, "loss": 0.253, "step": 2380 }, { "epoch": 0.06, "learning_rate": 0.0029099314122051105, "loss": 0.2479, "step": 2390 }, { "epoch": 0.06, "learning_rate": 0.002909554556189232, "loss": 0.2521, "step": 2400 }, { "epoch": 0.06, "learning_rate": 0.002909177700173354, "loss": 0.2561, "step": 2410 }, { "epoch": 0.06, "learning_rate": 0.0029088008441574757, "loss": 0.2518, "step": 2420 }, { "epoch": 0.06, "learning_rate": 0.0029084239881415975, "loss": 0.2552, "step": 2430 }, { "epoch": 0.06, "learning_rate": 0.002908047132125719, "loss": 0.2483, "step": 2440 }, { "epoch": 0.06, "learning_rate": 0.002907670276109841, "loss": 0.2593, "step": 2450 }, { "epoch": 0.06, "learning_rate": 0.002907293420093963, "loss": 0.2491, "step": 2460 }, { "epoch": 0.06, "learning_rate": 0.0029069165640780844, "loss": 0.2454, "step": 2470 }, { "epoch": 0.06, "learning_rate": 0.002906539708062206, "loss": 0.2516, "step": 2480 }, { "epoch": 0.06, "learning_rate": 0.0029061628520463284, "loss": 0.2493, "step": 2490 }, { "epoch": 0.06, "learning_rate": 0.00290578599603045, "loss": 0.2506, "step": 2500 }, { "epoch": 0.06, "eval_cer": 0.6693986112655058, "eval_loss": 0.18936096131801605, "eval_runtime": 90.6775, "eval_samples_per_second": 110.27, "eval_steps_per_second": 6.893, "step": 2500 }, { "epoch": 0.06, "learning_rate": 0.002905409140014572, "loss": 0.2495, "step": 2510 }, { "epoch": 0.06, "learning_rate": 0.0029050322839986936, "loss": 0.2504, "step": 2520 }, { "epoch": 0.06, "learning_rate": 0.0029046554279828153, "loss": 0.2385, "step": 2530 }, { "epoch": 0.06, "learning_rate": 0.0029042785719669375, "loss": 0.2492, "step": 2540 }, { "epoch": 0.06, "learning_rate": 0.002903901715951059, "loss": 0.2449, "step": 2550 }, { "epoch": 0.06, "learning_rate": 0.002903524859935181, "loss": 0.2387, "step": 2560 }, { "epoch": 0.06, "learning_rate": 0.0029031480039193027, "loss": 0.2418, "step": 2570 }, { "epoch": 0.06, "learning_rate": 0.0029027711479034245, "loss": 0.2452, "step": 2580 }, { "epoch": 0.07, "learning_rate": 0.0029023942918875462, "loss": 0.2497, "step": 2590 }, { "epoch": 0.07, "learning_rate": 0.002902017435871668, "loss": 0.2436, "step": 2600 }, { "epoch": 0.07, "learning_rate": 0.0029016405798557897, "loss": 0.2504, "step": 2610 }, { "epoch": 0.07, "learning_rate": 0.002901263723839912, "loss": 0.2471, "step": 2620 }, { "epoch": 0.07, "learning_rate": 0.002900886867824033, "loss": 0.2429, "step": 2630 }, { "epoch": 0.07, "learning_rate": 0.0029005100118081554, "loss": 0.2513, "step": 2640 }, { "epoch": 0.07, "learning_rate": 0.002900133155792277, "loss": 0.2373, "step": 2650 }, { "epoch": 0.07, "learning_rate": 0.002899756299776399, "loss": 0.2415, "step": 2660 }, { "epoch": 0.07, "learning_rate": 0.0028993794437605206, "loss": 0.2429, "step": 2670 }, { "epoch": 0.07, "learning_rate": 0.0028990025877446424, "loss": 0.2436, "step": 2680 }, { "epoch": 0.07, "learning_rate": 0.002898625731728764, "loss": 0.2379, "step": 2690 }, { "epoch": 0.07, "learning_rate": 0.002898248875712886, "loss": 0.2465, "step": 2700 }, { "epoch": 0.07, "learning_rate": 0.0028978720196970076, "loss": 0.2431, "step": 2710 }, { "epoch": 0.07, "learning_rate": 0.0028974951636811298, "loss": 0.24, "step": 2720 }, { "epoch": 0.07, "learning_rate": 0.0028971183076652515, "loss": 0.2464, "step": 2730 }, { "epoch": 0.07, "learning_rate": 0.0028967414516493733, "loss": 0.2404, "step": 2740 }, { "epoch": 0.07, "learning_rate": 0.002896364595633495, "loss": 0.2333, "step": 2750 }, { "epoch": 0.07, "learning_rate": 0.0028959877396176168, "loss": 0.2332, "step": 2760 }, { "epoch": 0.07, "learning_rate": 0.002895610883601739, "loss": 0.2387, "step": 2770 }, { "epoch": 0.07, "learning_rate": 0.0028952340275858602, "loss": 0.2393, "step": 2780 }, { "epoch": 0.07, "learning_rate": 0.002894857171569982, "loss": 0.2314, "step": 2790 }, { "epoch": 0.07, "learning_rate": 0.002894480315554104, "loss": 0.2372, "step": 2800 }, { "epoch": 0.07, "learning_rate": 0.002894103459538226, "loss": 0.2377, "step": 2810 }, { "epoch": 0.07, "learning_rate": 0.0028937266035223477, "loss": 0.2341, "step": 2820 }, { "epoch": 0.07, "learning_rate": 0.0028933497475064694, "loss": 0.2339, "step": 2830 }, { "epoch": 0.07, "learning_rate": 0.002892972891490591, "loss": 0.2373, "step": 2840 }, { "epoch": 0.07, "learning_rate": 0.0028925960354747133, "loss": 0.2328, "step": 2850 }, { "epoch": 0.07, "learning_rate": 0.0028922191794588346, "loss": 0.2343, "step": 2860 }, { "epoch": 0.07, "learning_rate": 0.002891842323442957, "loss": 0.2344, "step": 2870 }, { "epoch": 0.07, "learning_rate": 0.0028914654674270786, "loss": 0.2309, "step": 2880 }, { "epoch": 0.07, "learning_rate": 0.0028910886114112003, "loss": 0.234, "step": 2890 }, { "epoch": 0.07, "learning_rate": 0.002890711755395322, "loss": 0.2315, "step": 2900 }, { "epoch": 0.07, "learning_rate": 0.002890334899379444, "loss": 0.2377, "step": 2910 }, { "epoch": 0.07, "learning_rate": 0.0028899580433635655, "loss": 0.24, "step": 2920 }, { "epoch": 0.07, "learning_rate": 0.0028895811873476873, "loss": 0.2387, "step": 2930 }, { "epoch": 0.07, "learning_rate": 0.002889204331331809, "loss": 0.2373, "step": 2940 }, { "epoch": 0.07, "learning_rate": 0.002888827475315931, "loss": 0.2401, "step": 2950 }, { "epoch": 0.07, "learning_rate": 0.002888450619300053, "loss": 0.2361, "step": 2960 }, { "epoch": 0.07, "learning_rate": 0.0028880737632841747, "loss": 0.233, "step": 2970 }, { "epoch": 0.07, "learning_rate": 0.0028876969072682964, "loss": 0.2341, "step": 2980 }, { "epoch": 0.08, "learning_rate": 0.002887320051252418, "loss": 0.229, "step": 2990 }, { "epoch": 0.08, "learning_rate": 0.00288694319523654, "loss": 0.2305, "step": 3000 }, { "epoch": 0.08, "eval_cer": 0.6684963043916599, "eval_loss": 0.17874853312969208, "eval_runtime": 90.9659, "eval_samples_per_second": 109.92, "eval_steps_per_second": 6.871, "step": 3000 }, { "epoch": 0.08, "learning_rate": 0.0028865663392206617, "loss": 0.2329, "step": 3010 }, { "epoch": 0.08, "learning_rate": 0.0028861894832047834, "loss": 0.2329, "step": 3020 }, { "epoch": 0.08, "learning_rate": 0.0028858126271889056, "loss": 0.2329, "step": 3030 }, { "epoch": 0.08, "learning_rate": 0.0028854357711730273, "loss": 0.2301, "step": 3040 }, { "epoch": 0.08, "learning_rate": 0.002885058915157149, "loss": 0.2323, "step": 3050 }, { "epoch": 0.08, "learning_rate": 0.002884682059141271, "loss": 0.2234, "step": 3060 }, { "epoch": 0.08, "learning_rate": 0.0028843052031253926, "loss": 0.2317, "step": 3070 }, { "epoch": 0.08, "learning_rate": 0.0028839283471095148, "loss": 0.2335, "step": 3080 }, { "epoch": 0.08, "learning_rate": 0.002883551491093636, "loss": 0.2269, "step": 3090 }, { "epoch": 0.08, "learning_rate": 0.002883174635077758, "loss": 0.2328, "step": 3100 }, { "epoch": 0.08, "learning_rate": 0.00288279777906188, "loss": 0.2229, "step": 3110 }, { "epoch": 0.08, "learning_rate": 0.0028824209230460013, "loss": 0.227, "step": 3120 }, { "epoch": 0.08, "learning_rate": 0.0028820440670301235, "loss": 0.2255, "step": 3130 }, { "epoch": 0.08, "learning_rate": 0.0028816672110142452, "loss": 0.2209, "step": 3140 }, { "epoch": 0.08, "learning_rate": 0.002881290354998367, "loss": 0.2268, "step": 3150 }, { "epoch": 0.08, "learning_rate": 0.0028809134989824887, "loss": 0.2293, "step": 3160 }, { "epoch": 0.08, "learning_rate": 0.0028805366429666105, "loss": 0.2217, "step": 3170 }, { "epoch": 0.08, "learning_rate": 0.0028801597869507326, "loss": 0.2275, "step": 3180 }, { "epoch": 0.08, "learning_rate": 0.0028797829309348544, "loss": 0.2229, "step": 3190 }, { "epoch": 0.08, "learning_rate": 0.0028794060749189757, "loss": 0.2225, "step": 3200 }, { "epoch": 0.08, "learning_rate": 0.002879029218903098, "loss": 0.226, "step": 3210 }, { "epoch": 0.08, "learning_rate": 0.0028786523628872196, "loss": 0.226, "step": 3220 }, { "epoch": 0.08, "learning_rate": 0.0028782755068713414, "loss": 0.2239, "step": 3230 }, { "epoch": 0.08, "learning_rate": 0.002877898650855463, "loss": 0.2209, "step": 3240 }, { "epoch": 0.08, "learning_rate": 0.002877521794839585, "loss": 0.2225, "step": 3250 }, { "epoch": 0.08, "learning_rate": 0.002877144938823707, "loss": 0.2221, "step": 3260 }, { "epoch": 0.08, "learning_rate": 0.0028767680828078288, "loss": 0.2255, "step": 3270 }, { "epoch": 0.08, "learning_rate": 0.0028763912267919505, "loss": 0.2274, "step": 3280 }, { "epoch": 0.08, "learning_rate": 0.0028760143707760723, "loss": 0.2235, "step": 3290 }, { "epoch": 0.08, "learning_rate": 0.002875637514760194, "loss": 0.2264, "step": 3300 }, { "epoch": 0.08, "learning_rate": 0.002875260658744316, "loss": 0.2243, "step": 3310 }, { "epoch": 0.08, "learning_rate": 0.0028748838027284375, "loss": 0.2303, "step": 3320 }, { "epoch": 0.08, "learning_rate": 0.0028745069467125592, "loss": 0.2169, "step": 3330 }, { "epoch": 0.08, "learning_rate": 0.0028741300906966814, "loss": 0.2245, "step": 3340 }, { "epoch": 0.08, "learning_rate": 0.0028737532346808027, "loss": 0.219, "step": 3350 }, { "epoch": 0.08, "learning_rate": 0.002873376378664925, "loss": 0.2223, "step": 3360 }, { "epoch": 0.08, "learning_rate": 0.0028729995226490466, "loss": 0.2171, "step": 3370 }, { "epoch": 0.08, "learning_rate": 0.0028726226666331684, "loss": 0.2232, "step": 3380 }, { "epoch": 0.09, "learning_rate": 0.00287224581061729, "loss": 0.2228, "step": 3390 }, { "epoch": 0.09, "learning_rate": 0.002871868954601412, "loss": 0.2229, "step": 3400 }, { "epoch": 0.09, "learning_rate": 0.0028714920985855336, "loss": 0.2141, "step": 3410 }, { "epoch": 0.09, "learning_rate": 0.002871115242569656, "loss": 0.2212, "step": 3420 }, { "epoch": 0.09, "learning_rate": 0.002870738386553777, "loss": 0.2329, "step": 3430 }, { "epoch": 0.09, "learning_rate": 0.0028703615305378993, "loss": 0.2172, "step": 3440 }, { "epoch": 0.09, "learning_rate": 0.002869984674522021, "loss": 0.2235, "step": 3450 }, { "epoch": 0.09, "learning_rate": 0.002869607818506143, "loss": 0.2143, "step": 3460 }, { "epoch": 0.09, "learning_rate": 0.0028692309624902645, "loss": 0.2202, "step": 3470 }, { "epoch": 0.09, "learning_rate": 0.0028688541064743863, "loss": 0.2187, "step": 3480 }, { "epoch": 0.09, "learning_rate": 0.0028684772504585085, "loss": 0.2181, "step": 3490 }, { "epoch": 0.09, "learning_rate": 0.00286810039444263, "loss": 0.2206, "step": 3500 }, { "epoch": 0.09, "eval_cer": 0.668782636439627, "eval_loss": 0.1685170978307724, "eval_runtime": 90.6789, "eval_samples_per_second": 110.268, "eval_steps_per_second": 6.892, "step": 3500 }, { "epoch": 0.09, "learning_rate": 0.0028677235384267515, "loss": 0.2217, "step": 3510 }, { "epoch": 0.09, "learning_rate": 0.0028673466824108737, "loss": 0.2118, "step": 3520 }, { "epoch": 0.09, "learning_rate": 0.0028669698263949954, "loss": 0.2129, "step": 3530 }, { "epoch": 0.09, "learning_rate": 0.002866592970379117, "loss": 0.2189, "step": 3540 }, { "epoch": 0.09, "learning_rate": 0.002866216114363239, "loss": 0.2166, "step": 3550 }, { "epoch": 0.09, "learning_rate": 0.0028658392583473607, "loss": 0.2116, "step": 3560 }, { "epoch": 0.09, "learning_rate": 0.002865462402331483, "loss": 0.216, "step": 3570 }, { "epoch": 0.09, "learning_rate": 0.002865085546315604, "loss": 0.2173, "step": 3580 }, { "epoch": 0.09, "learning_rate": 0.0028647086902997263, "loss": 0.2213, "step": 3590 }, { "epoch": 0.09, "learning_rate": 0.002864331834283848, "loss": 0.213, "step": 3600 }, { "epoch": 0.09, "learning_rate": 0.00286395497826797, "loss": 0.2191, "step": 3610 }, { "epoch": 0.09, "learning_rate": 0.0028635781222520916, "loss": 0.2171, "step": 3620 }, { "epoch": 0.09, "learning_rate": 0.0028632012662362133, "loss": 0.2139, "step": 3630 }, { "epoch": 0.09, "learning_rate": 0.002862824410220335, "loss": 0.2152, "step": 3640 }, { "epoch": 0.09, "learning_rate": 0.0028624475542044572, "loss": 0.211, "step": 3650 }, { "epoch": 0.09, "learning_rate": 0.0028620706981885785, "loss": 0.2191, "step": 3660 }, { "epoch": 0.09, "learning_rate": 0.0028616938421727007, "loss": 0.2133, "step": 3670 }, { "epoch": 0.09, "learning_rate": 0.0028613169861568225, "loss": 0.2183, "step": 3680 }, { "epoch": 0.09, "learning_rate": 0.002860940130140944, "loss": 0.2118, "step": 3690 }, { "epoch": 0.09, "learning_rate": 0.002860563274125066, "loss": 0.2134, "step": 3700 }, { "epoch": 0.09, "learning_rate": 0.0028601864181091877, "loss": 0.2145, "step": 3710 }, { "epoch": 0.09, "learning_rate": 0.00285980956209331, "loss": 0.212, "step": 3720 }, { "epoch": 0.09, "learning_rate": 0.0028594327060774316, "loss": 0.2155, "step": 3730 }, { "epoch": 0.09, "learning_rate": 0.002859055850061553, "loss": 0.2131, "step": 3740 }, { "epoch": 0.09, "learning_rate": 0.002858678994045675, "loss": 0.2177, "step": 3750 }, { "epoch": 0.09, "learning_rate": 0.002858302138029797, "loss": 0.2219, "step": 3760 }, { "epoch": 0.09, "learning_rate": 0.0028579252820139186, "loss": 0.2193, "step": 3770 }, { "epoch": 0.09, "learning_rate": 0.0028575484259980403, "loss": 0.2107, "step": 3780 }, { "epoch": 0.1, "learning_rate": 0.002857171569982162, "loss": 0.2127, "step": 3790 }, { "epoch": 0.1, "learning_rate": 0.0028567947139662843, "loss": 0.2178, "step": 3800 }, { "epoch": 0.1, "learning_rate": 0.0028564178579504056, "loss": 0.2128, "step": 3810 }, { "epoch": 0.1, "learning_rate": 0.0028560410019345273, "loss": 0.2121, "step": 3820 }, { "epoch": 0.1, "learning_rate": 0.0028556641459186495, "loss": 0.2094, "step": 3830 }, { "epoch": 0.1, "learning_rate": 0.0028552872899027712, "loss": 0.2158, "step": 3840 }, { "epoch": 0.1, "learning_rate": 0.002854910433886893, "loss": 0.2161, "step": 3850 }, { "epoch": 0.1, "learning_rate": 0.0028545335778710147, "loss": 0.2145, "step": 3860 }, { "epoch": 0.1, "learning_rate": 0.0028541567218551365, "loss": 0.2089, "step": 3870 }, { "epoch": 0.1, "learning_rate": 0.0028537798658392587, "loss": 0.2088, "step": 3880 }, { "epoch": 0.1, "learning_rate": 0.00285340300982338, "loss": 0.2081, "step": 3890 }, { "epoch": 0.1, "learning_rate": 0.002853026153807502, "loss": 0.2111, "step": 3900 }, { "epoch": 0.1, "learning_rate": 0.002852649297791624, "loss": 0.2113, "step": 3910 }, { "epoch": 0.1, "learning_rate": 0.0028522724417757456, "loss": 0.2072, "step": 3920 }, { "epoch": 0.1, "learning_rate": 0.0028518955857598674, "loss": 0.2127, "step": 3930 }, { "epoch": 0.1, "learning_rate": 0.002851518729743989, "loss": 0.207, "step": 3940 }, { "epoch": 0.1, "learning_rate": 0.002851141873728111, "loss": 0.2079, "step": 3950 }, { "epoch": 0.1, "learning_rate": 0.002850765017712233, "loss": 0.2096, "step": 3960 }, { "epoch": 0.1, "learning_rate": 0.0028503881616963544, "loss": 0.2078, "step": 3970 }, { "epoch": 0.1, "learning_rate": 0.0028500113056804765, "loss": 0.2067, "step": 3980 }, { "epoch": 0.1, "learning_rate": 0.0028496344496645983, "loss": 0.2043, "step": 3990 }, { "epoch": 0.1, "learning_rate": 0.00284925759364872, "loss": 0.2086, "step": 4000 }, { "epoch": 0.1, "eval_cer": 0.6684727241053567, "eval_loss": 0.16068455576896667, "eval_runtime": 90.6058, "eval_samples_per_second": 110.357, "eval_steps_per_second": 6.898, "step": 4000 }, { "epoch": 0.1, "learning_rate": 0.0028488807376328418, "loss": 0.2033, "step": 4010 }, { "epoch": 0.1, "learning_rate": 0.0028485038816169635, "loss": 0.2086, "step": 4020 }, { "epoch": 0.1, "learning_rate": 0.0028481270256010857, "loss": 0.2048, "step": 4030 }, { "epoch": 0.1, "learning_rate": 0.002847750169585207, "loss": 0.2071, "step": 4040 }, { "epoch": 0.1, "learning_rate": 0.0028473733135693288, "loss": 0.2062, "step": 4050 }, { "epoch": 0.1, "learning_rate": 0.002846996457553451, "loss": 0.2096, "step": 4060 }, { "epoch": 0.1, "learning_rate": 0.0028466196015375727, "loss": 0.2108, "step": 4070 }, { "epoch": 0.1, "learning_rate": 0.0028462427455216944, "loss": 0.2058, "step": 4080 }, { "epoch": 0.1, "learning_rate": 0.002845865889505816, "loss": 0.2098, "step": 4090 }, { "epoch": 0.1, "learning_rate": 0.002845489033489938, "loss": 0.2044, "step": 4100 }, { "epoch": 0.1, "learning_rate": 0.00284511217747406, "loss": 0.2129, "step": 4110 }, { "epoch": 0.1, "learning_rate": 0.0028447353214581814, "loss": 0.2055, "step": 4120 }, { "epoch": 0.1, "learning_rate": 0.0028443584654423036, "loss": 0.2078, "step": 4130 }, { "epoch": 0.1, "learning_rate": 0.0028439816094264253, "loss": 0.2015, "step": 4140 }, { "epoch": 0.1, "learning_rate": 0.002843604753410547, "loss": 0.2001, "step": 4150 }, { "epoch": 0.1, "learning_rate": 0.002843227897394669, "loss": 0.2105, "step": 4160 }, { "epoch": 0.1, "learning_rate": 0.0028428510413787906, "loss": 0.2061, "step": 4170 }, { "epoch": 0.11, "learning_rate": 0.0028424741853629123, "loss": 0.2102, "step": 4180 }, { "epoch": 0.11, "learning_rate": 0.0028420973293470345, "loss": 0.2072, "step": 4190 }, { "epoch": 0.11, "learning_rate": 0.002841720473331156, "loss": 0.2004, "step": 4200 }, { "epoch": 0.11, "learning_rate": 0.002841343617315278, "loss": 0.2048, "step": 4210 }, { "epoch": 0.11, "learning_rate": 0.0028409667612993997, "loss": 0.2045, "step": 4220 }, { "epoch": 0.11, "learning_rate": 0.002840589905283521, "loss": 0.212, "step": 4230 }, { "epoch": 0.11, "learning_rate": 0.002840213049267643, "loss": 0.2036, "step": 4240 }, { "epoch": 0.11, "learning_rate": 0.002839836193251765, "loss": 0.2055, "step": 4250 }, { "epoch": 0.11, "learning_rate": 0.0028394593372358867, "loss": 0.2057, "step": 4260 }, { "epoch": 0.11, "learning_rate": 0.0028390824812200084, "loss": 0.202, "step": 4270 }, { "epoch": 0.11, "learning_rate": 0.00283870562520413, "loss": 0.2116, "step": 4280 }, { "epoch": 0.11, "learning_rate": 0.0028383287691882524, "loss": 0.2004, "step": 4290 }, { "epoch": 0.11, "learning_rate": 0.002837951913172374, "loss": 0.201, "step": 4300 }, { "epoch": 0.11, "learning_rate": 0.002837575057156496, "loss": 0.2058, "step": 4310 }, { "epoch": 0.11, "learning_rate": 0.0028371982011406176, "loss": 0.2019, "step": 4320 }, { "epoch": 0.11, "learning_rate": 0.0028368213451247393, "loss": 0.2054, "step": 4330 }, { "epoch": 0.11, "learning_rate": 0.0028364444891088615, "loss": 0.2049, "step": 4340 }, { "epoch": 0.11, "learning_rate": 0.002836067633092983, "loss": 0.2036, "step": 4350 }, { "epoch": 0.11, "learning_rate": 0.0028356907770771046, "loss": 0.1996, "step": 4360 }, { "epoch": 0.11, "learning_rate": 0.0028353139210612268, "loss": 0.2033, "step": 4370 }, { "epoch": 0.11, "learning_rate": 0.0028349370650453485, "loss": 0.2015, "step": 4380 }, { "epoch": 0.11, "learning_rate": 0.0028345602090294702, "loss": 0.1991, "step": 4390 }, { "epoch": 0.11, "learning_rate": 0.002834183353013592, "loss": 0.206, "step": 4400 }, { "epoch": 0.11, "learning_rate": 0.0028338064969977137, "loss": 0.2049, "step": 4410 }, { "epoch": 0.11, "learning_rate": 0.002833429640981836, "loss": 0.195, "step": 4420 }, { "epoch": 0.11, "learning_rate": 0.0028330527849659572, "loss": 0.1996, "step": 4430 }, { "epoch": 0.11, "learning_rate": 0.0028326759289500794, "loss": 0.1986, "step": 4440 }, { "epoch": 0.11, "learning_rate": 0.002832299072934201, "loss": 0.2058, "step": 4450 }, { "epoch": 0.11, "learning_rate": 0.0028319222169183225, "loss": 0.1988, "step": 4460 }, { "epoch": 0.11, "learning_rate": 0.0028315453609024446, "loss": 0.1954, "step": 4470 }, { "epoch": 0.11, "learning_rate": 0.0028311685048865664, "loss": 0.2005, "step": 4480 }, { "epoch": 0.11, "learning_rate": 0.002830791648870688, "loss": 0.1986, "step": 4490 }, { "epoch": 0.11, "learning_rate": 0.00283041479285481, "loss": 0.1955, "step": 4500 }, { "epoch": 0.11, "eval_cer": 0.6682609827589608, "eval_loss": 0.15178607404232025, "eval_runtime": 90.6612, "eval_samples_per_second": 110.29, "eval_steps_per_second": 6.894, "step": 4500 }, { "epoch": 0.11, "learning_rate": 0.0028300379368389316, "loss": 0.1974, "step": 4510 }, { "epoch": 0.11, "learning_rate": 0.002829661080823054, "loss": 0.1988, "step": 4520 }, { "epoch": 0.11, "learning_rate": 0.0028292842248071755, "loss": 0.2004, "step": 4530 }, { "epoch": 0.11, "learning_rate": 0.0028289073687912973, "loss": 0.1999, "step": 4540 }, { "epoch": 0.11, "learning_rate": 0.002828530512775419, "loss": 0.1944, "step": 4550 }, { "epoch": 0.11, "learning_rate": 0.0028281536567595408, "loss": 0.1953, "step": 4560 }, { "epoch": 0.11, "learning_rate": 0.0028277768007436625, "loss": 0.2002, "step": 4570 }, { "epoch": 0.12, "learning_rate": 0.0028273999447277843, "loss": 0.1997, "step": 4580 }, { "epoch": 0.12, "learning_rate": 0.002827023088711906, "loss": 0.201, "step": 4590 }, { "epoch": 0.12, "learning_rate": 0.002826646232696028, "loss": 0.2003, "step": 4600 }, { "epoch": 0.12, "learning_rate": 0.00282626937668015, "loss": 0.2066, "step": 4610 }, { "epoch": 0.12, "learning_rate": 0.0028258925206642717, "loss": 0.1923, "step": 4620 }, { "epoch": 0.12, "learning_rate": 0.0028255156646483934, "loss": 0.199, "step": 4630 }, { "epoch": 0.12, "learning_rate": 0.002825138808632515, "loss": 0.1977, "step": 4640 }, { "epoch": 0.12, "learning_rate": 0.0028247619526166373, "loss": 0.1968, "step": 4650 }, { "epoch": 0.12, "learning_rate": 0.0028243850966007586, "loss": 0.1967, "step": 4660 }, { "epoch": 0.12, "learning_rate": 0.0028240082405848804, "loss": 0.2042, "step": 4670 }, { "epoch": 0.12, "learning_rate": 0.0028236313845690026, "loss": 0.2012, "step": 4680 }, { "epoch": 0.12, "learning_rate": 0.002823254528553124, "loss": 0.1981, "step": 4690 }, { "epoch": 0.12, "learning_rate": 0.002822877672537246, "loss": 0.1926, "step": 4700 }, { "epoch": 0.12, "learning_rate": 0.002822500816521368, "loss": 0.1958, "step": 4710 }, { "epoch": 0.12, "learning_rate": 0.0028221239605054895, "loss": 0.1916, "step": 4720 }, { "epoch": 0.12, "learning_rate": 0.0028217471044896113, "loss": 0.2, "step": 4730 }, { "epoch": 0.12, "learning_rate": 0.002821370248473733, "loss": 0.1958, "step": 4740 }, { "epoch": 0.12, "learning_rate": 0.002820993392457855, "loss": 0.1976, "step": 4750 }, { "epoch": 0.12, "learning_rate": 0.002820616536441977, "loss": 0.1966, "step": 4760 }, { "epoch": 0.12, "learning_rate": 0.0028202396804260983, "loss": 0.1917, "step": 4770 }, { "epoch": 0.12, "learning_rate": 0.0028198628244102204, "loss": 0.2017, "step": 4780 }, { "epoch": 0.12, "learning_rate": 0.002819485968394342, "loss": 0.1975, "step": 4790 }, { "epoch": 0.12, "learning_rate": 0.002819109112378464, "loss": 0.1965, "step": 4800 }, { "epoch": 0.12, "learning_rate": 0.0028187322563625857, "loss": 0.1967, "step": 4810 }, { "epoch": 0.12, "learning_rate": 0.0028183554003467074, "loss": 0.2022, "step": 4820 }, { "epoch": 0.12, "learning_rate": 0.0028179785443308296, "loss": 0.1958, "step": 4830 }, { "epoch": 0.12, "learning_rate": 0.0028176016883149513, "loss": 0.1923, "step": 4840 }, { "epoch": 0.12, "learning_rate": 0.002817224832299073, "loss": 0.2005, "step": 4850 }, { "epoch": 0.12, "learning_rate": 0.002816847976283195, "loss": 0.1913, "step": 4860 }, { "epoch": 0.12, "learning_rate": 0.0028164711202673166, "loss": 0.1938, "step": 4870 }, { "epoch": 0.12, "learning_rate": 0.0028160942642514388, "loss": 0.1997, "step": 4880 }, { "epoch": 0.12, "learning_rate": 0.00281571740823556, "loss": 0.1955, "step": 4890 }, { "epoch": 0.12, "learning_rate": 0.002815340552219682, "loss": 0.1907, "step": 4900 }, { "epoch": 0.12, "learning_rate": 0.002814963696203804, "loss": 0.1961, "step": 4910 }, { "epoch": 0.12, "learning_rate": 0.0028145868401879253, "loss": 0.1959, "step": 4920 }, { "epoch": 0.12, "learning_rate": 0.0028142099841720475, "loss": 0.1943, "step": 4930 }, { "epoch": 0.12, "learning_rate": 0.0028138331281561692, "loss": 0.1934, "step": 4940 }, { "epoch": 0.12, "learning_rate": 0.002813456272140291, "loss": 0.2008, "step": 4950 }, { "epoch": 0.12, "learning_rate": 0.0028130794161244127, "loss": 0.1866, "step": 4960 }, { "epoch": 0.12, "learning_rate": 0.0028127025601085345, "loss": 0.197, "step": 4970 }, { "epoch": 0.13, "learning_rate": 0.002812325704092656, "loss": 0.1916, "step": 4980 }, { "epoch": 0.13, "learning_rate": 0.0028119488480767784, "loss": 0.1928, "step": 4990 }, { "epoch": 0.13, "learning_rate": 0.0028115719920608997, "loss": 0.1903, "step": 5000 }, { "epoch": 0.13, "eval_cer": 0.6685646390989058, "eval_loss": 0.14745888113975525, "eval_runtime": 90.6922, "eval_samples_per_second": 110.252, "eval_steps_per_second": 6.891, "step": 5000 }, { "epoch": 0.13, "learning_rate": 0.002811195136045022, "loss": 0.1923, "step": 5010 }, { "epoch": 0.13, "learning_rate": 0.0028108182800291436, "loss": 0.1937, "step": 5020 }, { "epoch": 0.13, "learning_rate": 0.0028104414240132654, "loss": 0.1935, "step": 5030 }, { "epoch": 0.13, "learning_rate": 0.002810064567997387, "loss": 0.1921, "step": 5040 }, { "epoch": 0.13, "learning_rate": 0.002809687711981509, "loss": 0.1966, "step": 5050 }, { "epoch": 0.13, "learning_rate": 0.002809310855965631, "loss": 0.1934, "step": 5060 }, { "epoch": 0.13, "learning_rate": 0.0028089339999497528, "loss": 0.1895, "step": 5070 }, { "epoch": 0.13, "learning_rate": 0.002808557143933874, "loss": 0.194, "step": 5080 }, { "epoch": 0.13, "learning_rate": 0.0028081802879179963, "loss": 0.1948, "step": 5090 }, { "epoch": 0.13, "learning_rate": 0.002807803431902118, "loss": 0.1917, "step": 5100 }, { "epoch": 0.13, "learning_rate": 0.0028074265758862398, "loss": 0.1955, "step": 5110 }, { "epoch": 0.13, "learning_rate": 0.0028070497198703615, "loss": 0.189, "step": 5120 }, { "epoch": 0.13, "learning_rate": 0.0028066728638544832, "loss": 0.1943, "step": 5130 }, { "epoch": 0.13, "learning_rate": 0.0028062960078386054, "loss": 0.1898, "step": 5140 }, { "epoch": 0.13, "learning_rate": 0.0028059191518227267, "loss": 0.1896, "step": 5150 }, { "epoch": 0.13, "learning_rate": 0.002805542295806849, "loss": 0.1919, "step": 5160 }, { "epoch": 0.13, "learning_rate": 0.0028051654397909707, "loss": 0.1935, "step": 5170 }, { "epoch": 0.13, "learning_rate": 0.0028047885837750924, "loss": 0.1876, "step": 5180 }, { "epoch": 0.13, "learning_rate": 0.002804411727759214, "loss": 0.1914, "step": 5190 }, { "epoch": 0.13, "learning_rate": 0.002804034871743336, "loss": 0.1891, "step": 5200 }, { "epoch": 0.13, "learning_rate": 0.0028036580157274576, "loss": 0.1908, "step": 5210 }, { "epoch": 0.13, "learning_rate": 0.00280328115971158, "loss": 0.1893, "step": 5220 }, { "epoch": 0.13, "learning_rate": 0.002802904303695701, "loss": 0.1848, "step": 5230 }, { "epoch": 0.13, "learning_rate": 0.0028025274476798233, "loss": 0.1922, "step": 5240 }, { "epoch": 0.13, "learning_rate": 0.002802150591663945, "loss": 0.1921, "step": 5250 }, { "epoch": 0.13, "learning_rate": 0.002801773735648067, "loss": 0.1927, "step": 5260 }, { "epoch": 0.13, "learning_rate": 0.0028013968796321885, "loss": 0.191, "step": 5270 }, { "epoch": 0.13, "learning_rate": 0.0028010200236163103, "loss": 0.1963, "step": 5280 }, { "epoch": 0.13, "learning_rate": 0.0028006431676004325, "loss": 0.1873, "step": 5290 }, { "epoch": 0.13, "learning_rate": 0.002800266311584554, "loss": 0.1908, "step": 5300 }, { "epoch": 0.13, "learning_rate": 0.0027998894555686755, "loss": 0.1866, "step": 5310 }, { "epoch": 0.13, "learning_rate": 0.0027995125995527977, "loss": 0.1935, "step": 5320 }, { "epoch": 0.13, "learning_rate": 0.0027991357435369194, "loss": 0.1892, "step": 5330 }, { "epoch": 0.13, "learning_rate": 0.002798758887521041, "loss": 0.1894, "step": 5340 }, { "epoch": 0.13, "learning_rate": 0.002798382031505163, "loss": 0.1812, "step": 5350 }, { "epoch": 0.13, "learning_rate": 0.0027980051754892847, "loss": 0.1868, "step": 5360 }, { "epoch": 0.13, "learning_rate": 0.002797628319473407, "loss": 0.1905, "step": 5370 }, { "epoch": 0.14, "learning_rate": 0.002797251463457528, "loss": 0.191, "step": 5380 }, { "epoch": 0.14, "learning_rate": 0.00279687460744165, "loss": 0.192, "step": 5390 }, { "epoch": 0.14, "learning_rate": 0.002796497751425772, "loss": 0.1865, "step": 5400 }, { "epoch": 0.14, "learning_rate": 0.002796120895409894, "loss": 0.1868, "step": 5410 }, { "epoch": 0.14, "learning_rate": 0.0027957440393940156, "loss": 0.184, "step": 5420 }, { "epoch": 0.14, "learning_rate": 0.0027953671833781373, "loss": 0.1909, "step": 5430 }, { "epoch": 0.14, "learning_rate": 0.002794990327362259, "loss": 0.1797, "step": 5440 }, { "epoch": 0.14, "learning_rate": 0.0027946134713463812, "loss": 0.1846, "step": 5450 }, { "epoch": 0.14, "learning_rate": 0.0027942366153305026, "loss": 0.1869, "step": 5460 }, { "epoch": 0.14, "learning_rate": 0.0027938597593146247, "loss": 0.1831, "step": 5470 }, { "epoch": 0.14, "learning_rate": 0.0027934829032987465, "loss": 0.1836, "step": 5480 }, { "epoch": 0.14, "learning_rate": 0.0027931060472828682, "loss": 0.1878, "step": 5490 }, { "epoch": 0.14, "learning_rate": 0.00279272919126699, "loss": 0.1827, "step": 5500 }, { "epoch": 0.14, "eval_cer": 0.6683553039041735, "eval_loss": 0.14301101863384247, "eval_runtime": 90.7398, "eval_samples_per_second": 110.194, "eval_steps_per_second": 6.888, "step": 5500 }, { "epoch": 0.14, "learning_rate": 0.0027923523352511117, "loss": 0.1803, "step": 5510 }, { "epoch": 0.14, "learning_rate": 0.0027919754792352335, "loss": 0.1819, "step": 5520 }, { "epoch": 0.14, "learning_rate": 0.0027915986232193556, "loss": 0.1879, "step": 5530 }, { "epoch": 0.14, "learning_rate": 0.002791221767203477, "loss": 0.1881, "step": 5540 }, { "epoch": 0.14, "learning_rate": 0.002790844911187599, "loss": 0.1878, "step": 5550 }, { "epoch": 0.14, "learning_rate": 0.002790468055171721, "loss": 0.1852, "step": 5560 }, { "epoch": 0.14, "learning_rate": 0.0027900911991558426, "loss": 0.1871, "step": 5570 }, { "epoch": 0.14, "learning_rate": 0.0027897143431399644, "loss": 0.184, "step": 5580 }, { "epoch": 0.14, "learning_rate": 0.002789337487124086, "loss": 0.1865, "step": 5590 }, { "epoch": 0.14, "learning_rate": 0.0027889606311082083, "loss": 0.1845, "step": 5600 }, { "epoch": 0.14, "learning_rate": 0.0027885837750923296, "loss": 0.1866, "step": 5610 }, { "epoch": 0.14, "learning_rate": 0.0027882069190764513, "loss": 0.185, "step": 5620 }, { "epoch": 0.14, "learning_rate": 0.0027878300630605735, "loss": 0.1838, "step": 5630 }, { "epoch": 0.14, "learning_rate": 0.0027874532070446953, "loss": 0.1822, "step": 5640 }, { "epoch": 0.14, "learning_rate": 0.002787076351028817, "loss": 0.1854, "step": 5650 }, { "epoch": 0.14, "learning_rate": 0.0027866994950129387, "loss": 0.1828, "step": 5660 }, { "epoch": 0.14, "learning_rate": 0.0027863226389970605, "loss": 0.1816, "step": 5670 }, { "epoch": 0.14, "learning_rate": 0.0027859457829811827, "loss": 0.1771, "step": 5680 }, { "epoch": 0.14, "learning_rate": 0.002785568926965304, "loss": 0.1881, "step": 5690 }, { "epoch": 0.14, "learning_rate": 0.002785192070949426, "loss": 0.1787, "step": 5700 }, { "epoch": 0.14, "learning_rate": 0.002784815214933548, "loss": 0.1839, "step": 5710 }, { "epoch": 0.14, "learning_rate": 0.0027844383589176696, "loss": 0.1817, "step": 5720 }, { "epoch": 0.14, "learning_rate": 0.0027840615029017914, "loss": 0.1831, "step": 5730 }, { "epoch": 0.14, "learning_rate": 0.002783684646885913, "loss": 0.1844, "step": 5740 }, { "epoch": 0.14, "learning_rate": 0.002783307790870035, "loss": 0.1846, "step": 5750 }, { "epoch": 0.14, "learning_rate": 0.002782930934854157, "loss": 0.1784, "step": 5760 }, { "epoch": 0.14, "learning_rate": 0.0027825540788382784, "loss": 0.1817, "step": 5770 }, { "epoch": 0.15, "learning_rate": 0.0027821772228224005, "loss": 0.1807, "step": 5780 }, { "epoch": 0.15, "learning_rate": 0.0027818003668065223, "loss": 0.1805, "step": 5790 }, { "epoch": 0.15, "learning_rate": 0.0027814235107906436, "loss": 0.1813, "step": 5800 }, { "epoch": 0.15, "learning_rate": 0.0027810466547747658, "loss": 0.1821, "step": 5810 }, { "epoch": 0.15, "learning_rate": 0.0027806697987588875, "loss": 0.1809, "step": 5820 }, { "epoch": 0.15, "learning_rate": 0.0027802929427430093, "loss": 0.1834, "step": 5830 }, { "epoch": 0.15, "learning_rate": 0.002779916086727131, "loss": 0.1811, "step": 5840 }, { "epoch": 0.15, "learning_rate": 0.0027795392307112528, "loss": 0.1823, "step": 5850 }, { "epoch": 0.15, "learning_rate": 0.002779162374695375, "loss": 0.1896, "step": 5860 }, { "epoch": 0.15, "learning_rate": 0.0027787855186794967, "loss": 0.1767, "step": 5870 }, { "epoch": 0.15, "learning_rate": 0.0027784086626636184, "loss": 0.1821, "step": 5880 }, { "epoch": 0.15, "learning_rate": 0.00277803180664774, "loss": 0.1769, "step": 5890 }, { "epoch": 0.15, "learning_rate": 0.002777654950631862, "loss": 0.185, "step": 5900 }, { "epoch": 0.15, "learning_rate": 0.002777278094615984, "loss": 0.1842, "step": 5910 }, { "epoch": 0.15, "learning_rate": 0.0027769012386001054, "loss": 0.1786, "step": 5920 }, { "epoch": 0.15, "learning_rate": 0.002776524382584227, "loss": 0.1771, "step": 5930 }, { "epoch": 0.15, "learning_rate": 0.0027761475265683493, "loss": 0.1717, "step": 5940 }, { "epoch": 0.15, "learning_rate": 0.002775770670552471, "loss": 0.1858, "step": 5950 }, { "epoch": 0.15, "learning_rate": 0.002775393814536593, "loss": 0.1809, "step": 5960 }, { "epoch": 0.15, "learning_rate": 0.0027750169585207146, "loss": 0.1767, "step": 5970 }, { "epoch": 0.15, "learning_rate": 0.0027746401025048363, "loss": 0.179, "step": 5980 }, { "epoch": 0.15, "learning_rate": 0.0027742632464889585, "loss": 0.1799, "step": 5990 }, { "epoch": 0.15, "learning_rate": 0.00277388639047308, "loss": 0.1775, "step": 6000 }, { "epoch": 0.15, "eval_cer": 0.6680800401538589, "eval_loss": 0.13693051040172577, "eval_runtime": 90.8542, "eval_samples_per_second": 110.055, "eval_steps_per_second": 6.879, "step": 6000 }, { "epoch": 0.15, "learning_rate": 0.002773509534457202, "loss": 0.1767, "step": 6010 }, { "epoch": 0.15, "learning_rate": 0.0027731326784413237, "loss": 0.1782, "step": 6020 }, { "epoch": 0.15, "learning_rate": 0.002772755822425445, "loss": 0.1818, "step": 6030 }, { "epoch": 0.15, "learning_rate": 0.002772378966409567, "loss": 0.1827, "step": 6040 }, { "epoch": 0.15, "learning_rate": 0.002772002110393689, "loss": 0.1795, "step": 6050 }, { "epoch": 0.15, "learning_rate": 0.0027716252543778107, "loss": 0.1785, "step": 6060 }, { "epoch": 0.15, "learning_rate": 0.0027712483983619324, "loss": 0.1761, "step": 6070 }, { "epoch": 0.15, "learning_rate": 0.002770871542346054, "loss": 0.1768, "step": 6080 }, { "epoch": 0.15, "learning_rate": 0.0027704946863301764, "loss": 0.1788, "step": 6090 }, { "epoch": 0.15, "learning_rate": 0.002770117830314298, "loss": 0.18, "step": 6100 }, { "epoch": 0.15, "learning_rate": 0.00276974097429842, "loss": 0.1763, "step": 6110 }, { "epoch": 0.15, "learning_rate": 0.0027693641182825416, "loss": 0.1843, "step": 6120 }, { "epoch": 0.15, "learning_rate": 0.0027689872622666633, "loss": 0.1754, "step": 6130 }, { "epoch": 0.15, "learning_rate": 0.0027686104062507855, "loss": 0.1811, "step": 6140 }, { "epoch": 0.15, "learning_rate": 0.002768233550234907, "loss": 0.181, "step": 6150 }, { "epoch": 0.15, "learning_rate": 0.0027678566942190286, "loss": 0.1804, "step": 6160 }, { "epoch": 0.16, "learning_rate": 0.0027674798382031508, "loss": 0.1789, "step": 6170 }, { "epoch": 0.16, "learning_rate": 0.0027671029821872725, "loss": 0.181, "step": 6180 }, { "epoch": 0.16, "learning_rate": 0.0027667261261713942, "loss": 0.1832, "step": 6190 }, { "epoch": 0.16, "learning_rate": 0.002766349270155516, "loss": 0.1808, "step": 6200 }, { "epoch": 0.16, "learning_rate": 0.0027659724141396377, "loss": 0.1828, "step": 6210 }, { "epoch": 0.16, "learning_rate": 0.00276559555812376, "loss": 0.1813, "step": 6220 }, { "epoch": 0.16, "learning_rate": 0.0027652187021078812, "loss": 0.1782, "step": 6230 }, { "epoch": 0.16, "learning_rate": 0.002764841846092003, "loss": 0.1724, "step": 6240 }, { "epoch": 0.16, "learning_rate": 0.002764464990076125, "loss": 0.1748, "step": 6250 }, { "epoch": 0.16, "learning_rate": 0.0027640881340602465, "loss": 0.1731, "step": 6260 }, { "epoch": 0.16, "learning_rate": 0.0027637112780443686, "loss": 0.177, "step": 6270 }, { "epoch": 0.16, "learning_rate": 0.0027633344220284904, "loss": 0.175, "step": 6280 }, { "epoch": 0.16, "learning_rate": 0.002762957566012612, "loss": 0.1784, "step": 6290 }, { "epoch": 0.16, "learning_rate": 0.002762580709996734, "loss": 0.1754, "step": 6300 }, { "epoch": 0.16, "learning_rate": 0.0027622038539808556, "loss": 0.1801, "step": 6310 }, { "epoch": 0.16, "learning_rate": 0.002761826997964978, "loss": 0.175, "step": 6320 }, { "epoch": 0.16, "learning_rate": 0.0027614501419490995, "loss": 0.1724, "step": 6330 }, { "epoch": 0.16, "learning_rate": 0.002761073285933221, "loss": 0.1784, "step": 6340 }, { "epoch": 0.16, "learning_rate": 0.002760696429917343, "loss": 0.1811, "step": 6350 }, { "epoch": 0.16, "learning_rate": 0.0027603195739014648, "loss": 0.1784, "step": 6360 }, { "epoch": 0.16, "learning_rate": 0.0027599427178855865, "loss": 0.1747, "step": 6370 }, { "epoch": 0.16, "learning_rate": 0.0027595658618697083, "loss": 0.1711, "step": 6380 }, { "epoch": 0.16, "learning_rate": 0.00275918900585383, "loss": 0.1755, "step": 6390 }, { "epoch": 0.16, "learning_rate": 0.002758812149837952, "loss": 0.175, "step": 6400 }, { "epoch": 0.16, "learning_rate": 0.002758435293822074, "loss": 0.1723, "step": 6410 }, { "epoch": 0.16, "learning_rate": 0.0027580584378061957, "loss": 0.1707, "step": 6420 }, { "epoch": 0.16, "learning_rate": 0.0027576815817903174, "loss": 0.1744, "step": 6430 }, { "epoch": 0.16, "learning_rate": 0.002757304725774439, "loss": 0.1719, "step": 6440 }, { "epoch": 0.16, "learning_rate": 0.0027569278697585613, "loss": 0.1782, "step": 6450 }, { "epoch": 0.16, "learning_rate": 0.0027565510137426827, "loss": 0.1684, "step": 6460 }, { "epoch": 0.16, "learning_rate": 0.0027561741577268044, "loss": 0.171, "step": 6470 }, { "epoch": 0.16, "learning_rate": 0.0027557973017109266, "loss": 0.1759, "step": 6480 }, { "epoch": 0.16, "learning_rate": 0.002755420445695048, "loss": 0.1723, "step": 6490 }, { "epoch": 0.16, "learning_rate": 0.00275504358967917, "loss": 0.1748, "step": 6500 }, { "epoch": 0.16, "eval_cer": 0.6680973644458368, "eval_loss": 0.13586829602718353, "eval_runtime": 90.7366, "eval_samples_per_second": 110.198, "eval_steps_per_second": 6.888, "step": 6500 }, { "epoch": 0.16, "learning_rate": 0.002754666733663292, "loss": 0.1766, "step": 6510 }, { "epoch": 0.16, "learning_rate": 0.0027542898776474136, "loss": 0.1798, "step": 6520 }, { "epoch": 0.16, "learning_rate": 0.0027539130216315353, "loss": 0.1747, "step": 6530 }, { "epoch": 0.16, "learning_rate": 0.002753536165615657, "loss": 0.1724, "step": 6540 }, { "epoch": 0.16, "learning_rate": 0.0027531593095997792, "loss": 0.1781, "step": 6550 }, { "epoch": 0.16, "learning_rate": 0.002752782453583901, "loss": 0.1793, "step": 6560 }, { "epoch": 0.17, "learning_rate": 0.0027524055975680223, "loss": 0.1741, "step": 6570 }, { "epoch": 0.17, "learning_rate": 0.0027520287415521445, "loss": 0.1745, "step": 6580 }, { "epoch": 0.17, "learning_rate": 0.002751651885536266, "loss": 0.1749, "step": 6590 }, { "epoch": 0.17, "learning_rate": 0.002751275029520388, "loss": 0.1789, "step": 6600 }, { "epoch": 0.17, "learning_rate": 0.0027508981735045097, "loss": 0.1792, "step": 6610 }, { "epoch": 0.17, "learning_rate": 0.0027505213174886314, "loss": 0.1773, "step": 6620 }, { "epoch": 0.17, "learning_rate": 0.0027501444614727536, "loss": 0.1733, "step": 6630 }, { "epoch": 0.17, "learning_rate": 0.0027497676054568754, "loss": 0.1701, "step": 6640 }, { "epoch": 0.17, "learning_rate": 0.0027493907494409967, "loss": 0.1755, "step": 6650 }, { "epoch": 0.17, "learning_rate": 0.002749013893425119, "loss": 0.1711, "step": 6660 }, { "epoch": 0.17, "learning_rate": 0.0027486370374092406, "loss": 0.1697, "step": 6670 }, { "epoch": 0.17, "learning_rate": 0.0027482601813933623, "loss": 0.1697, "step": 6680 }, { "epoch": 0.17, "learning_rate": 0.002747883325377484, "loss": 0.1699, "step": 6690 }, { "epoch": 0.17, "learning_rate": 0.002747506469361606, "loss": 0.1709, "step": 6700 }, { "epoch": 0.17, "learning_rate": 0.002747129613345728, "loss": 0.1693, "step": 6710 }, { "epoch": 0.17, "learning_rate": 0.0027467527573298493, "loss": 0.1742, "step": 6720 }, { "epoch": 0.17, "learning_rate": 0.0027463759013139715, "loss": 0.1763, "step": 6730 }, { "epoch": 0.17, "learning_rate": 0.0027459990452980932, "loss": 0.1661, "step": 6740 }, { "epoch": 0.17, "learning_rate": 0.002745622189282215, "loss": 0.167, "step": 6750 }, { "epoch": 0.17, "learning_rate": 0.0027452453332663367, "loss": 0.1745, "step": 6760 }, { "epoch": 0.17, "learning_rate": 0.0027448684772504585, "loss": 0.1694, "step": 6770 }, { "epoch": 0.17, "learning_rate": 0.00274449162123458, "loss": 0.1685, "step": 6780 }, { "epoch": 0.17, "learning_rate": 0.0027441147652187024, "loss": 0.1706, "step": 6790 }, { "epoch": 0.17, "learning_rate": 0.0027437379092028237, "loss": 0.1723, "step": 6800 }, { "epoch": 0.17, "learning_rate": 0.002743361053186946, "loss": 0.1669, "step": 6810 }, { "epoch": 0.17, "learning_rate": 0.0027429841971710676, "loss": 0.1722, "step": 6820 }, { "epoch": 0.17, "learning_rate": 0.0027426073411551894, "loss": 0.1665, "step": 6830 }, { "epoch": 0.17, "learning_rate": 0.002742230485139311, "loss": 0.1748, "step": 6840 }, { "epoch": 0.17, "learning_rate": 0.002741853629123433, "loss": 0.1727, "step": 6850 }, { "epoch": 0.17, "learning_rate": 0.002741476773107555, "loss": 0.1731, "step": 6860 }, { "epoch": 0.17, "learning_rate": 0.002741099917091677, "loss": 0.1707, "step": 6870 }, { "epoch": 0.17, "learning_rate": 0.002740723061075798, "loss": 0.1672, "step": 6880 }, { "epoch": 0.17, "learning_rate": 0.0027403462050599203, "loss": 0.1678, "step": 6890 }, { "epoch": 0.17, "learning_rate": 0.002739969349044042, "loss": 0.1673, "step": 6900 }, { "epoch": 0.17, "learning_rate": 0.0027395924930281638, "loss": 0.181, "step": 6910 }, { "epoch": 0.17, "learning_rate": 0.0027392156370122855, "loss": 0.1734, "step": 6920 }, { "epoch": 0.17, "learning_rate": 0.0027388387809964073, "loss": 0.1664, "step": 6930 }, { "epoch": 0.17, "learning_rate": 0.0027384619249805294, "loss": 0.1695, "step": 6940 }, { "epoch": 0.17, "learning_rate": 0.0027380850689646507, "loss": 0.1669, "step": 6950 }, { "epoch": 0.17, "learning_rate": 0.0027377082129487725, "loss": 0.168, "step": 6960 }, { "epoch": 0.18, "learning_rate": 0.0027373313569328947, "loss": 0.1689, "step": 6970 }, { "epoch": 0.18, "learning_rate": 0.0027369545009170164, "loss": 0.1741, "step": 6980 }, { "epoch": 0.18, "learning_rate": 0.002736577644901138, "loss": 0.169, "step": 6990 }, { "epoch": 0.18, "learning_rate": 0.00273620078888526, "loss": 0.1725, "step": 7000 }, { "epoch": 0.18, "eval_cer": 0.6677037180336736, "eval_loss": 0.1311553418636322, "eval_runtime": 90.7293, "eval_samples_per_second": 110.207, "eval_steps_per_second": 6.889, "step": 7000 }, { "epoch": 0.18, "learning_rate": 0.0027358239328693816, "loss": 0.165, "step": 7010 }, { "epoch": 0.18, "learning_rate": 0.002735447076853504, "loss": 0.1721, "step": 7020 }, { "epoch": 0.18, "learning_rate": 0.002735070220837625, "loss": 0.1703, "step": 7030 }, { "epoch": 0.18, "learning_rate": 0.0027346933648217473, "loss": 0.1648, "step": 7040 }, { "epoch": 0.18, "learning_rate": 0.002734316508805869, "loss": 0.1708, "step": 7050 }, { "epoch": 0.18, "learning_rate": 0.002733939652789991, "loss": 0.1714, "step": 7060 }, { "epoch": 0.18, "learning_rate": 0.0027335627967741125, "loss": 0.1664, "step": 7070 }, { "epoch": 0.18, "learning_rate": 0.0027331859407582343, "loss": 0.1664, "step": 7080 }, { "epoch": 0.18, "learning_rate": 0.002732809084742356, "loss": 0.1704, "step": 7090 }, { "epoch": 0.18, "learning_rate": 0.002732432228726478, "loss": 0.1641, "step": 7100 }, { "epoch": 0.18, "learning_rate": 0.0027320553727105995, "loss": 0.1701, "step": 7110 }, { "epoch": 0.18, "learning_rate": 0.0027316785166947217, "loss": 0.1656, "step": 7120 }, { "epoch": 0.18, "learning_rate": 0.0027313016606788434, "loss": 0.1751, "step": 7130 }, { "epoch": 0.18, "learning_rate": 0.002730924804662965, "loss": 0.1656, "step": 7140 }, { "epoch": 0.18, "learning_rate": 0.002730547948647087, "loss": 0.1692, "step": 7150 }, { "epoch": 0.18, "learning_rate": 0.0027301710926312087, "loss": 0.1725, "step": 7160 }, { "epoch": 0.18, "learning_rate": 0.002729794236615331, "loss": 0.174, "step": 7170 }, { "epoch": 0.18, "learning_rate": 0.002729417380599452, "loss": 0.1702, "step": 7180 }, { "epoch": 0.18, "learning_rate": 0.002729040524583574, "loss": 0.1714, "step": 7190 }, { "epoch": 0.18, "learning_rate": 0.002728663668567696, "loss": 0.1688, "step": 7200 }, { "epoch": 0.18, "learning_rate": 0.002728286812551818, "loss": 0.1692, "step": 7210 }, { "epoch": 0.18, "learning_rate": 0.0027279099565359396, "loss": 0.1651, "step": 7220 }, { "epoch": 0.18, "learning_rate": 0.0027275331005200613, "loss": 0.1707, "step": 7230 }, { "epoch": 0.18, "learning_rate": 0.002727156244504183, "loss": 0.1701, "step": 7240 }, { "epoch": 0.18, "learning_rate": 0.0027267793884883052, "loss": 0.1677, "step": 7250 }, { "epoch": 0.18, "learning_rate": 0.0027264025324724266, "loss": 0.1681, "step": 7260 }, { "epoch": 0.18, "learning_rate": 0.0027260256764565487, "loss": 0.1704, "step": 7270 }, { "epoch": 0.18, "learning_rate": 0.0027256488204406705, "loss": 0.1638, "step": 7280 }, { "epoch": 0.18, "learning_rate": 0.0027252719644247922, "loss": 0.1685, "step": 7290 }, { "epoch": 0.18, "learning_rate": 0.002724895108408914, "loss": 0.1696, "step": 7300 }, { "epoch": 0.18, "learning_rate": 0.0027245182523930357, "loss": 0.1719, "step": 7310 }, { "epoch": 0.18, "learning_rate": 0.0027241413963771575, "loss": 0.1699, "step": 7320 }, { "epoch": 0.18, "learning_rate": 0.0027237645403612796, "loss": 0.1745, "step": 7330 }, { "epoch": 0.18, "learning_rate": 0.002723387684345401, "loss": 0.1663, "step": 7340 }, { "epoch": 0.18, "learning_rate": 0.002723010828329523, "loss": 0.1715, "step": 7350 }, { "epoch": 0.18, "learning_rate": 0.002722633972313645, "loss": 0.1624, "step": 7360 }, { "epoch": 0.19, "learning_rate": 0.002722257116297766, "loss": 0.1615, "step": 7370 }, { "epoch": 0.19, "learning_rate": 0.0027218802602818884, "loss": 0.1689, "step": 7380 }, { "epoch": 0.19, "learning_rate": 0.00272150340426601, "loss": 0.1653, "step": 7390 }, { "epoch": 0.19, "learning_rate": 0.002721126548250132, "loss": 0.1636, "step": 7400 }, { "epoch": 0.19, "learning_rate": 0.0027207496922342536, "loss": 0.1663, "step": 7410 }, { "epoch": 0.19, "learning_rate": 0.0027203728362183753, "loss": 0.1667, "step": 7420 }, { "epoch": 0.19, "learning_rate": 0.0027199959802024975, "loss": 0.1652, "step": 7430 }, { "epoch": 0.19, "learning_rate": 0.0027196191241866193, "loss": 0.1632, "step": 7440 }, { "epoch": 0.19, "learning_rate": 0.002719242268170741, "loss": 0.1662, "step": 7450 }, { "epoch": 0.19, "learning_rate": 0.0027188654121548628, "loss": 0.1704, "step": 7460 }, { "epoch": 0.19, "learning_rate": 0.0027184885561389845, "loss": 0.1654, "step": 7470 }, { "epoch": 0.19, "learning_rate": 0.0027181117001231067, "loss": 0.1664, "step": 7480 }, { "epoch": 0.19, "learning_rate": 0.002717734844107228, "loss": 0.1684, "step": 7490 }, { "epoch": 0.19, "learning_rate": 0.0027173579880913497, "loss": 0.1638, "step": 7500 }, { "epoch": 0.19, "eval_cer": 0.6673577134244495, "eval_loss": 0.12540632486343384, "eval_runtime": 90.7183, "eval_samples_per_second": 110.22, "eval_steps_per_second": 6.889, "step": 7500 }, { "epoch": 0.19, "learning_rate": 0.002716981132075472, "loss": 0.1615, "step": 7510 }, { "epoch": 0.19, "learning_rate": 0.0027166042760595937, "loss": 0.1672, "step": 7520 }, { "epoch": 0.19, "learning_rate": 0.0027162274200437154, "loss": 0.1614, "step": 7530 }, { "epoch": 0.19, "learning_rate": 0.002715850564027837, "loss": 0.1683, "step": 7540 }, { "epoch": 0.19, "learning_rate": 0.002715473708011959, "loss": 0.1678, "step": 7550 }, { "epoch": 0.19, "learning_rate": 0.002715096851996081, "loss": 0.1719, "step": 7560 }, { "epoch": 0.19, "learning_rate": 0.0027147199959802024, "loss": 0.1639, "step": 7570 }, { "epoch": 0.19, "learning_rate": 0.0027143431399643246, "loss": 0.1657, "step": 7580 }, { "epoch": 0.19, "learning_rate": 0.0027139662839484463, "loss": 0.1622, "step": 7590 }, { "epoch": 0.19, "learning_rate": 0.0027135894279325676, "loss": 0.1608, "step": 7600 }, { "epoch": 0.19, "learning_rate": 0.00271321257191669, "loss": 0.1639, "step": 7610 }, { "epoch": 0.19, "learning_rate": 0.0027128357159008115, "loss": 0.1637, "step": 7620 }, { "epoch": 0.19, "learning_rate": 0.0027124588598849333, "loss": 0.1616, "step": 7630 }, { "epoch": 0.19, "learning_rate": 0.002712082003869055, "loss": 0.1625, "step": 7640 }, { "epoch": 0.19, "learning_rate": 0.0027117051478531768, "loss": 0.1658, "step": 7650 }, { "epoch": 0.19, "learning_rate": 0.002711328291837299, "loss": 0.1619, "step": 7660 }, { "epoch": 0.19, "learning_rate": 0.0027109514358214207, "loss": 0.1601, "step": 7670 }, { "epoch": 0.19, "learning_rate": 0.0027105745798055424, "loss": 0.1628, "step": 7680 }, { "epoch": 0.19, "learning_rate": 0.002710197723789664, "loss": 0.1701, "step": 7690 }, { "epoch": 0.19, "learning_rate": 0.002709820867773786, "loss": 0.1665, "step": 7700 }, { "epoch": 0.19, "learning_rate": 0.002709444011757908, "loss": 0.1698, "step": 7710 }, { "epoch": 0.19, "learning_rate": 0.0027090671557420294, "loss": 0.1634, "step": 7720 }, { "epoch": 0.19, "learning_rate": 0.002708690299726151, "loss": 0.1635, "step": 7730 }, { "epoch": 0.19, "learning_rate": 0.0027083134437102733, "loss": 0.1643, "step": 7740 }, { "epoch": 0.19, "learning_rate": 0.002707936587694395, "loss": 0.165, "step": 7750 }, { "epoch": 0.19, "learning_rate": 0.002707559731678517, "loss": 0.1601, "step": 7760 }, { "epoch": 0.2, "learning_rate": 0.0027071828756626386, "loss": 0.1633, "step": 7770 }, { "epoch": 0.2, "learning_rate": 0.0027068060196467603, "loss": 0.1602, "step": 7780 }, { "epoch": 0.2, "learning_rate": 0.002706429163630882, "loss": 0.1597, "step": 7790 }, { "epoch": 0.2, "learning_rate": 0.002706052307615004, "loss": 0.16, "step": 7800 }, { "epoch": 0.2, "learning_rate": 0.0027056754515991255, "loss": 0.1593, "step": 7810 }, { "epoch": 0.2, "learning_rate": 0.0027052985955832477, "loss": 0.1646, "step": 7820 }, { "epoch": 0.2, "learning_rate": 0.002704921739567369, "loss": 0.1648, "step": 7830 }, { "epoch": 0.2, "learning_rate": 0.0027045448835514912, "loss": 0.1686, "step": 7840 }, { "epoch": 0.2, "learning_rate": 0.002704168027535613, "loss": 0.1635, "step": 7850 }, { "epoch": 0.2, "learning_rate": 0.0027037911715197347, "loss": 0.1628, "step": 7860 }, { "epoch": 0.2, "learning_rate": 0.0027034143155038565, "loss": 0.1598, "step": 7870 }, { "epoch": 0.2, "learning_rate": 0.002703037459487978, "loss": 0.1633, "step": 7880 }, { "epoch": 0.2, "learning_rate": 0.0027026606034721004, "loss": 0.1604, "step": 7890 }, { "epoch": 0.2, "learning_rate": 0.002702283747456222, "loss": 0.1615, "step": 7900 }, { "epoch": 0.2, "learning_rate": 0.0027019068914403434, "loss": 0.1638, "step": 7910 }, { "epoch": 0.2, "learning_rate": 0.0027015300354244656, "loss": 0.1612, "step": 7920 }, { "epoch": 0.2, "learning_rate": 0.0027011531794085874, "loss": 0.1611, "step": 7930 }, { "epoch": 0.2, "learning_rate": 0.002700776323392709, "loss": 0.1629, "step": 7940 }, { "epoch": 0.2, "learning_rate": 0.002700399467376831, "loss": 0.1689, "step": 7950 }, { "epoch": 0.2, "learning_rate": 0.0027000226113609526, "loss": 0.1613, "step": 7960 }, { "epoch": 0.2, "learning_rate": 0.0026996457553450748, "loss": 0.166, "step": 7970 }, { "epoch": 0.2, "learning_rate": 0.0026992688993291965, "loss": 0.165, "step": 7980 }, { "epoch": 0.2, "learning_rate": 0.0026988920433133183, "loss": 0.1707, "step": 7990 }, { "epoch": 0.2, "learning_rate": 0.00269851518729744, "loss": 0.1575, "step": 8000 }, { "epoch": 0.2, "eval_cer": 0.6680179614409384, "eval_loss": 0.12548059225082397, "eval_runtime": 90.4279, "eval_samples_per_second": 110.574, "eval_steps_per_second": 6.912, "step": 8000 }, { "epoch": 0.2, "learning_rate": 0.0026981383312815617, "loss": 0.1597, "step": 8010 }, { "epoch": 0.2, "learning_rate": 0.0026977614752656835, "loss": 0.1661, "step": 8020 }, { "epoch": 0.2, "learning_rate": 0.0026973846192498052, "loss": 0.1591, "step": 8030 }, { "epoch": 0.2, "learning_rate": 0.002697007763233927, "loss": 0.1668, "step": 8040 }, { "epoch": 0.2, "learning_rate": 0.002696630907218049, "loss": 0.1674, "step": 8050 }, { "epoch": 0.2, "learning_rate": 0.0026962540512021705, "loss": 0.1625, "step": 8060 }, { "epoch": 0.2, "learning_rate": 0.0026958771951862926, "loss": 0.1587, "step": 8070 }, { "epoch": 0.2, "learning_rate": 0.0026955003391704144, "loss": 0.1635, "step": 8080 }, { "epoch": 0.2, "learning_rate": 0.002695123483154536, "loss": 0.1636, "step": 8090 }, { "epoch": 0.2, "learning_rate": 0.002694746627138658, "loss": 0.1598, "step": 8100 }, { "epoch": 0.2, "learning_rate": 0.0026943697711227796, "loss": 0.1644, "step": 8110 }, { "epoch": 0.2, "learning_rate": 0.002693992915106902, "loss": 0.1574, "step": 8120 }, { "epoch": 0.2, "learning_rate": 0.0026936160590910235, "loss": 0.1608, "step": 8130 }, { "epoch": 0.2, "learning_rate": 0.002693239203075145, "loss": 0.1604, "step": 8140 }, { "epoch": 0.2, "learning_rate": 0.002692862347059267, "loss": 0.1629, "step": 8150 }, { "epoch": 0.21, "learning_rate": 0.0026924854910433888, "loss": 0.1596, "step": 8160 }, { "epoch": 0.21, "learning_rate": 0.0026921086350275105, "loss": 0.1584, "step": 8170 }, { "epoch": 0.21, "learning_rate": 0.0026917317790116323, "loss": 0.1615, "step": 8180 }, { "epoch": 0.21, "learning_rate": 0.002691354922995754, "loss": 0.164, "step": 8190 }, { "epoch": 0.21, "learning_rate": 0.002690978066979876, "loss": 0.1634, "step": 8200 }, { "epoch": 0.21, "learning_rate": 0.002690601210963998, "loss": 0.156, "step": 8210 }, { "epoch": 0.21, "learning_rate": 0.0026902243549481192, "loss": 0.1569, "step": 8220 }, { "epoch": 0.21, "learning_rate": 0.0026898474989322414, "loss": 0.1591, "step": 8230 }, { "epoch": 0.21, "learning_rate": 0.002689470642916363, "loss": 0.1608, "step": 8240 }, { "epoch": 0.21, "learning_rate": 0.002689093786900485, "loss": 0.1595, "step": 8250 }, { "epoch": 0.21, "learning_rate": 0.0026887169308846067, "loss": 0.1562, "step": 8260 }, { "epoch": 0.21, "learning_rate": 0.0026883400748687284, "loss": 0.1594, "step": 8270 }, { "epoch": 0.21, "learning_rate": 0.0026879632188528506, "loss": 0.1568, "step": 8280 }, { "epoch": 0.21, "learning_rate": 0.002687586362836972, "loss": 0.1591, "step": 8290 }, { "epoch": 0.21, "learning_rate": 0.002687209506821094, "loss": 0.1639, "step": 8300 }, { "epoch": 0.21, "learning_rate": 0.002686832650805216, "loss": 0.1567, "step": 8310 }, { "epoch": 0.21, "learning_rate": 0.0026864557947893376, "loss": 0.1523, "step": 8320 }, { "epoch": 0.21, "learning_rate": 0.0026860789387734593, "loss": 0.1588, "step": 8330 }, { "epoch": 0.21, "learning_rate": 0.002685702082757581, "loss": 0.1595, "step": 8340 }, { "epoch": 0.21, "learning_rate": 0.002685325226741703, "loss": 0.1538, "step": 8350 }, { "epoch": 0.21, "learning_rate": 0.002684948370725825, "loss": 0.1553, "step": 8360 }, { "epoch": 0.21, "learning_rate": 0.0026845715147099463, "loss": 0.1606, "step": 8370 }, { "epoch": 0.21, "learning_rate": 0.0026841946586940685, "loss": 0.1583, "step": 8380 }, { "epoch": 0.21, "learning_rate": 0.00268381780267819, "loss": 0.1617, "step": 8390 }, { "epoch": 0.21, "learning_rate": 0.002683440946662312, "loss": 0.1617, "step": 8400 }, { "epoch": 0.21, "learning_rate": 0.0026830640906464337, "loss": 0.1655, "step": 8410 }, { "epoch": 0.21, "learning_rate": 0.0026826872346305554, "loss": 0.1588, "step": 8420 }, { "epoch": 0.21, "learning_rate": 0.0026823103786146776, "loss": 0.159, "step": 8430 }, { "epoch": 0.21, "learning_rate": 0.0026819335225987994, "loss": 0.1575, "step": 8440 }, { "epoch": 0.21, "learning_rate": 0.0026815566665829207, "loss": 0.1613, "step": 8450 }, { "epoch": 0.21, "learning_rate": 0.002681179810567043, "loss": 0.1639, "step": 8460 }, { "epoch": 0.21, "learning_rate": 0.0026808029545511646, "loss": 0.1566, "step": 8470 }, { "epoch": 0.21, "learning_rate": 0.0026804260985352863, "loss": 0.1544, "step": 8480 }, { "epoch": 0.21, "learning_rate": 0.002680049242519408, "loss": 0.1562, "step": 8490 }, { "epoch": 0.21, "learning_rate": 0.00267967238650353, "loss": 0.1537, "step": 8500 }, { "epoch": 0.21, "eval_cer": 0.667791783184561, "eval_loss": 0.12038606405258179, "eval_runtime": 90.1852, "eval_samples_per_second": 110.872, "eval_steps_per_second": 6.93, "step": 8500 }, { "epoch": 0.21, "learning_rate": 0.002679295530487652, "loss": 0.157, "step": 8510 }, { "epoch": 0.21, "learning_rate": 0.0026789186744717733, "loss": 0.1542, "step": 8520 }, { "epoch": 0.21, "learning_rate": 0.0026785418184558955, "loss": 0.1577, "step": 8530 }, { "epoch": 0.21, "learning_rate": 0.0026781649624400172, "loss": 0.1522, "step": 8540 }, { "epoch": 0.21, "learning_rate": 0.002677788106424139, "loss": 0.1552, "step": 8550 }, { "epoch": 0.22, "learning_rate": 0.0026774112504082607, "loss": 0.1594, "step": 8560 }, { "epoch": 0.22, "learning_rate": 0.0026770343943923825, "loss": 0.1573, "step": 8570 }, { "epoch": 0.22, "learning_rate": 0.0026766575383765042, "loss": 0.1579, "step": 8580 }, { "epoch": 0.22, "learning_rate": 0.0026762806823606264, "loss": 0.1571, "step": 8590 }, { "epoch": 0.22, "learning_rate": 0.0026759038263447477, "loss": 0.1538, "step": 8600 }, { "epoch": 0.22, "learning_rate": 0.00267552697032887, "loss": 0.1554, "step": 8610 }, { "epoch": 0.22, "learning_rate": 0.0026751501143129916, "loss": 0.1599, "step": 8620 }, { "epoch": 0.22, "learning_rate": 0.0026747732582971134, "loss": 0.1531, "step": 8630 }, { "epoch": 0.22, "learning_rate": 0.002674396402281235, "loss": 0.1559, "step": 8640 }, { "epoch": 0.22, "learning_rate": 0.002674019546265357, "loss": 0.1578, "step": 8650 }, { "epoch": 0.22, "learning_rate": 0.0026736426902494786, "loss": 0.1547, "step": 8660 }, { "epoch": 0.22, "learning_rate": 0.002673265834233601, "loss": 0.1564, "step": 8670 }, { "epoch": 0.22, "learning_rate": 0.002672888978217722, "loss": 0.1585, "step": 8680 }, { "epoch": 0.22, "learning_rate": 0.0026725121222018443, "loss": 0.1596, "step": 8690 }, { "epoch": 0.22, "learning_rate": 0.002672135266185966, "loss": 0.1595, "step": 8700 }, { "epoch": 0.22, "learning_rate": 0.0026717584101700878, "loss": 0.1609, "step": 8710 }, { "epoch": 0.22, "learning_rate": 0.0026713815541542095, "loss": 0.1543, "step": 8720 }, { "epoch": 0.22, "learning_rate": 0.0026710046981383313, "loss": 0.1536, "step": 8730 }, { "epoch": 0.22, "learning_rate": 0.0026706278421224534, "loss": 0.1575, "step": 8740 }, { "epoch": 0.22, "learning_rate": 0.0026702509861065747, "loss": 0.1567, "step": 8750 }, { "epoch": 0.22, "learning_rate": 0.0026698741300906965, "loss": 0.1524, "step": 8760 }, { "epoch": 0.22, "learning_rate": 0.0026694972740748187, "loss": 0.1548, "step": 8770 }, { "epoch": 0.22, "learning_rate": 0.0026691204180589404, "loss": 0.163, "step": 8780 }, { "epoch": 0.22, "learning_rate": 0.002668743562043062, "loss": 0.1542, "step": 8790 }, { "epoch": 0.22, "learning_rate": 0.002668366706027184, "loss": 0.1597, "step": 8800 }, { "epoch": 0.22, "learning_rate": 0.0026679898500113057, "loss": 0.1549, "step": 8810 }, { "epoch": 0.22, "learning_rate": 0.002667612993995428, "loss": 0.1563, "step": 8820 }, { "epoch": 0.22, "learning_rate": 0.002667236137979549, "loss": 0.1545, "step": 8830 }, { "epoch": 0.22, "learning_rate": 0.0026668592819636713, "loss": 0.1552, "step": 8840 }, { "epoch": 0.22, "learning_rate": 0.002666482425947793, "loss": 0.1593, "step": 8850 }, { "epoch": 0.22, "learning_rate": 0.002666105569931915, "loss": 0.157, "step": 8860 }, { "epoch": 0.22, "learning_rate": 0.0026657287139160366, "loss": 0.1524, "step": 8870 }, { "epoch": 0.22, "learning_rate": 0.0026653518579001583, "loss": 0.1548, "step": 8880 }, { "epoch": 0.22, "learning_rate": 0.00266497500188428, "loss": 0.1554, "step": 8890 }, { "epoch": 0.22, "learning_rate": 0.002664598145868402, "loss": 0.1548, "step": 8900 }, { "epoch": 0.22, "learning_rate": 0.0026642212898525235, "loss": 0.1591, "step": 8910 }, { "epoch": 0.22, "learning_rate": 0.0026638444338366457, "loss": 0.1623, "step": 8920 }, { "epoch": 0.22, "learning_rate": 0.0026634675778207675, "loss": 0.1566, "step": 8930 }, { "epoch": 0.22, "learning_rate": 0.002663090721804889, "loss": 0.1569, "step": 8940 }, { "epoch": 0.22, "learning_rate": 0.002662713865789011, "loss": 0.1552, "step": 8950 }, { "epoch": 0.23, "learning_rate": 0.0026623370097731327, "loss": 0.1543, "step": 8960 }, { "epoch": 0.23, "learning_rate": 0.0026619601537572544, "loss": 0.1516, "step": 8970 }, { "epoch": 0.23, "learning_rate": 0.002661583297741376, "loss": 0.1585, "step": 8980 }, { "epoch": 0.23, "learning_rate": 0.002661206441725498, "loss": 0.1547, "step": 8990 }, { "epoch": 0.23, "learning_rate": 0.00266082958570962, "loss": 0.1516, "step": 9000 }, { "epoch": 0.23, "eval_cer": 0.6670555007755027, "eval_loss": 0.1187540739774704, "eval_runtime": 90.5351, "eval_samples_per_second": 110.443, "eval_steps_per_second": 6.903, "step": 9000 }, { "epoch": 0.23, "learning_rate": 0.002660452729693742, "loss": 0.1551, "step": 9010 }, { "epoch": 0.23, "learning_rate": 0.0026600758736778636, "loss": 0.155, "step": 9020 }, { "epoch": 0.23, "learning_rate": 0.0026596990176619853, "loss": 0.1571, "step": 9030 }, { "epoch": 0.23, "learning_rate": 0.002659322161646107, "loss": 0.1491, "step": 9040 }, { "epoch": 0.23, "learning_rate": 0.0026589453056302293, "loss": 0.1536, "step": 9050 }, { "epoch": 0.23, "learning_rate": 0.0026585684496143506, "loss": 0.1514, "step": 9060 }, { "epoch": 0.23, "learning_rate": 0.0026581915935984723, "loss": 0.1523, "step": 9070 }, { "epoch": 0.23, "learning_rate": 0.0026578147375825945, "loss": 0.1593, "step": 9080 }, { "epoch": 0.23, "learning_rate": 0.0026574378815667162, "loss": 0.1543, "step": 9090 }, { "epoch": 0.23, "learning_rate": 0.002657061025550838, "loss": 0.159, "step": 9100 }, { "epoch": 0.23, "learning_rate": 0.0026566841695349597, "loss": 0.1543, "step": 9110 }, { "epoch": 0.23, "learning_rate": 0.0026563073135190815, "loss": 0.1497, "step": 9120 }, { "epoch": 0.23, "learning_rate": 0.002655930457503203, "loss": 0.1571, "step": 9130 }, { "epoch": 0.23, "learning_rate": 0.002655553601487325, "loss": 0.147, "step": 9140 }, { "epoch": 0.23, "learning_rate": 0.002655176745471447, "loss": 0.1499, "step": 9150 }, { "epoch": 0.23, "learning_rate": 0.002654799889455569, "loss": 0.1535, "step": 9160 }, { "epoch": 0.23, "learning_rate": 0.00265442303343969, "loss": 0.1488, "step": 9170 }, { "epoch": 0.23, "learning_rate": 0.0026540461774238124, "loss": 0.1491, "step": 9180 }, { "epoch": 0.23, "learning_rate": 0.002653669321407934, "loss": 0.1522, "step": 9190 }, { "epoch": 0.23, "learning_rate": 0.002653292465392056, "loss": 0.1526, "step": 9200 }, { "epoch": 0.23, "learning_rate": 0.0026529156093761776, "loss": 0.1534, "step": 9210 }, { "epoch": 0.23, "learning_rate": 0.0026525387533602993, "loss": 0.1514, "step": 9220 }, { "epoch": 0.23, "learning_rate": 0.0026521618973444215, "loss": 0.1523, "step": 9230 }, { "epoch": 0.23, "learning_rate": 0.0026517850413285433, "loss": 0.1571, "step": 9240 }, { "epoch": 0.23, "learning_rate": 0.002651408185312665, "loss": 0.1532, "step": 9250 }, { "epoch": 0.23, "learning_rate": 0.0026510313292967868, "loss": 0.1553, "step": 9260 }, { "epoch": 0.23, "learning_rate": 0.0026506544732809085, "loss": 0.1542, "step": 9270 }, { "epoch": 0.23, "learning_rate": 0.0026502776172650307, "loss": 0.1551, "step": 9280 }, { "epoch": 0.23, "learning_rate": 0.002649900761249152, "loss": 0.1512, "step": 9290 }, { "epoch": 0.23, "learning_rate": 0.0026495239052332737, "loss": 0.1526, "step": 9300 }, { "epoch": 0.23, "learning_rate": 0.002649147049217396, "loss": 0.1514, "step": 9310 }, { "epoch": 0.23, "learning_rate": 0.0026487701932015177, "loss": 0.1491, "step": 9320 }, { "epoch": 0.23, "learning_rate": 0.0026483933371856394, "loss": 0.1533, "step": 9330 }, { "epoch": 0.23, "learning_rate": 0.002648016481169761, "loss": 0.1565, "step": 9340 }, { "epoch": 0.23, "learning_rate": 0.002647639625153883, "loss": 0.1524, "step": 9350 }, { "epoch": 0.24, "learning_rate": 0.0026472627691380046, "loss": 0.1549, "step": 9360 }, { "epoch": 0.24, "learning_rate": 0.0026468859131221264, "loss": 0.1529, "step": 9370 }, { "epoch": 0.24, "learning_rate": 0.002646509057106248, "loss": 0.1491, "step": 9380 }, { "epoch": 0.24, "learning_rate": 0.0026461322010903703, "loss": 0.1525, "step": 9390 }, { "epoch": 0.24, "learning_rate": 0.0026457553450744916, "loss": 0.1459, "step": 9400 }, { "epoch": 0.24, "learning_rate": 0.002645378489058614, "loss": 0.1476, "step": 9410 }, { "epoch": 0.24, "learning_rate": 0.0026450016330427355, "loss": 0.1494, "step": 9420 }, { "epoch": 0.24, "learning_rate": 0.0026446247770268573, "loss": 0.1497, "step": 9430 }, { "epoch": 0.24, "learning_rate": 0.002644247921010979, "loss": 0.1502, "step": 9440 }, { "epoch": 0.24, "learning_rate": 0.0026438710649951008, "loss": 0.15, "step": 9450 }, { "epoch": 0.24, "learning_rate": 0.002643494208979223, "loss": 0.1536, "step": 9460 }, { "epoch": 0.24, "learning_rate": 0.0026431173529633447, "loss": 0.151, "step": 9470 }, { "epoch": 0.24, "learning_rate": 0.002642740496947466, "loss": 0.1478, "step": 9480 }, { "epoch": 0.24, "learning_rate": 0.002642363640931588, "loss": 0.1505, "step": 9490 }, { "epoch": 0.24, "learning_rate": 0.00264198678491571, "loss": 0.1526, "step": 9500 }, { "epoch": 0.24, "eval_cer": 0.667285047644209, "eval_loss": 0.11501982808113098, "eval_runtime": 89.9198, "eval_samples_per_second": 111.199, "eval_steps_per_second": 6.951, "step": 9500 }, { "epoch": 0.24, "learning_rate": 0.0026416099288998317, "loss": 0.1529, "step": 9510 }, { "epoch": 0.24, "learning_rate": 0.0026412330728839534, "loss": 0.1544, "step": 9520 }, { "epoch": 0.24, "learning_rate": 0.002640856216868075, "loss": 0.1497, "step": 9530 }, { "epoch": 0.24, "learning_rate": 0.0026404793608521973, "loss": 0.1521, "step": 9540 }, { "epoch": 0.24, "learning_rate": 0.002640102504836319, "loss": 0.1553, "step": 9550 }, { "epoch": 0.24, "learning_rate": 0.002639725648820441, "loss": 0.149, "step": 9560 }, { "epoch": 0.24, "learning_rate": 0.0026393487928045626, "loss": 0.1555, "step": 9570 }, { "epoch": 0.24, "learning_rate": 0.0026389719367886843, "loss": 0.1505, "step": 9580 }, { "epoch": 0.24, "learning_rate": 0.002638595080772806, "loss": 0.1515, "step": 9590 }, { "epoch": 0.24, "learning_rate": 0.002638218224756928, "loss": 0.1544, "step": 9600 }, { "epoch": 0.24, "learning_rate": 0.0026378413687410496, "loss": 0.1442, "step": 9610 }, { "epoch": 0.24, "learning_rate": 0.0026374645127251717, "loss": 0.1497, "step": 9620 }, { "epoch": 0.24, "learning_rate": 0.002637087656709293, "loss": 0.1522, "step": 9630 }, { "epoch": 0.24, "learning_rate": 0.0026367108006934152, "loss": 0.1506, "step": 9640 }, { "epoch": 0.24, "learning_rate": 0.002636333944677537, "loss": 0.1538, "step": 9650 }, { "epoch": 0.24, "learning_rate": 0.0026359570886616587, "loss": 0.1514, "step": 9660 }, { "epoch": 0.24, "learning_rate": 0.0026355802326457805, "loss": 0.1471, "step": 9670 }, { "epoch": 0.24, "learning_rate": 0.002635203376629902, "loss": 0.1514, "step": 9680 }, { "epoch": 0.24, "learning_rate": 0.0026348265206140244, "loss": 0.148, "step": 9690 }, { "epoch": 0.24, "learning_rate": 0.002634449664598146, "loss": 0.1483, "step": 9700 }, { "epoch": 0.24, "learning_rate": 0.0026340728085822674, "loss": 0.1489, "step": 9710 }, { "epoch": 0.24, "learning_rate": 0.0026336959525663896, "loss": 0.153, "step": 9720 }, { "epoch": 0.24, "learning_rate": 0.0026333190965505114, "loss": 0.1479, "step": 9730 }, { "epoch": 0.24, "learning_rate": 0.002632942240534633, "loss": 0.1529, "step": 9740 }, { "epoch": 0.24, "learning_rate": 0.002632565384518755, "loss": 0.152, "step": 9750 }, { "epoch": 0.25, "learning_rate": 0.0026321885285028766, "loss": 0.147, "step": 9760 }, { "epoch": 0.25, "learning_rate": 0.0026318116724869988, "loss": 0.1452, "step": 9770 }, { "epoch": 0.25, "learning_rate": 0.0026314348164711205, "loss": 0.1497, "step": 9780 }, { "epoch": 0.25, "learning_rate": 0.002631057960455242, "loss": 0.1526, "step": 9790 }, { "epoch": 0.25, "learning_rate": 0.002630681104439364, "loss": 0.148, "step": 9800 }, { "epoch": 0.25, "learning_rate": 0.0026303042484234858, "loss": 0.1471, "step": 9810 }, { "epoch": 0.25, "learning_rate": 0.0026299273924076075, "loss": 0.1492, "step": 9820 }, { "epoch": 0.25, "learning_rate": 0.0026295505363917292, "loss": 0.1562, "step": 9830 }, { "epoch": 0.25, "learning_rate": 0.002629173680375851, "loss": 0.1489, "step": 9840 }, { "epoch": 0.25, "learning_rate": 0.002628796824359973, "loss": 0.1514, "step": 9850 }, { "epoch": 0.25, "learning_rate": 0.0026284199683440945, "loss": 0.1559, "step": 9860 }, { "epoch": 0.25, "learning_rate": 0.0026280431123282167, "loss": 0.1519, "step": 9870 }, { "epoch": 0.25, "learning_rate": 0.0026276662563123384, "loss": 0.1481, "step": 9880 }, { "epoch": 0.25, "learning_rate": 0.00262728940029646, "loss": 0.1425, "step": 9890 }, { "epoch": 0.25, "learning_rate": 0.002626912544280582, "loss": 0.1518, "step": 9900 }, { "epoch": 0.25, "learning_rate": 0.0026265356882647036, "loss": 0.1476, "step": 9910 }, { "epoch": 0.25, "learning_rate": 0.0026261588322488254, "loss": 0.1456, "step": 9920 }, { "epoch": 0.25, "learning_rate": 0.0026257819762329476, "loss": 0.1481, "step": 9930 }, { "epoch": 0.25, "learning_rate": 0.002625405120217069, "loss": 0.146, "step": 9940 }, { "epoch": 0.25, "learning_rate": 0.002625028264201191, "loss": 0.155, "step": 9950 }, { "epoch": 0.25, "learning_rate": 0.002624651408185313, "loss": 0.1448, "step": 9960 }, { "epoch": 0.25, "learning_rate": 0.0026242745521694345, "loss": 0.1575, "step": 9970 }, { "epoch": 0.25, "learning_rate": 0.0026238976961535563, "loss": 0.1424, "step": 9980 }, { "epoch": 0.25, "learning_rate": 0.002623520840137678, "loss": 0.1496, "step": 9990 }, { "epoch": 0.25, "learning_rate": 0.0026231439841218, "loss": 0.148, "step": 10000 }, { "epoch": 0.25, "eval_cer": 0.6675872602931558, "eval_loss": 0.11312033236026764, "eval_runtime": 90.4563, "eval_samples_per_second": 110.54, "eval_steps_per_second": 6.909, "step": 10000 }, { "epoch": 0.25, "learning_rate": 0.002622767128105922, "loss": 0.1537, "step": 10010 }, { "epoch": 0.25, "learning_rate": 0.0026223902720900433, "loss": 0.1447, "step": 10020 }, { "epoch": 0.25, "learning_rate": 0.0026220134160741654, "loss": 0.1481, "step": 10030 }, { "epoch": 0.25, "learning_rate": 0.002621636560058287, "loss": 0.1485, "step": 10040 }, { "epoch": 0.25, "learning_rate": 0.002621259704042409, "loss": 0.1495, "step": 10050 }, { "epoch": 0.25, "learning_rate": 0.0026208828480265307, "loss": 0.1483, "step": 10060 }, { "epoch": 0.25, "learning_rate": 0.0026205059920106524, "loss": 0.1487, "step": 10070 }, { "epoch": 0.25, "learning_rate": 0.0026201291359947746, "loss": 0.1462, "step": 10080 }, { "epoch": 0.25, "learning_rate": 0.002619752279978896, "loss": 0.1475, "step": 10090 }, { "epoch": 0.25, "learning_rate": 0.002619375423963018, "loss": 0.1431, "step": 10100 }, { "epoch": 0.25, "learning_rate": 0.00261899856794714, "loss": 0.1455, "step": 10110 }, { "epoch": 0.25, "learning_rate": 0.0026186217119312616, "loss": 0.1504, "step": 10120 }, { "epoch": 0.25, "learning_rate": 0.0026182448559153833, "loss": 0.1509, "step": 10130 }, { "epoch": 0.25, "learning_rate": 0.002617867999899505, "loss": 0.1464, "step": 10140 }, { "epoch": 0.26, "learning_rate": 0.002617491143883627, "loss": 0.1461, "step": 10150 }, { "epoch": 0.26, "learning_rate": 0.002617114287867749, "loss": 0.1512, "step": 10160 }, { "epoch": 0.26, "learning_rate": 0.0026167374318518703, "loss": 0.1487, "step": 10170 }, { "epoch": 0.26, "learning_rate": 0.0026163605758359925, "loss": 0.1443, "step": 10180 }, { "epoch": 0.26, "learning_rate": 0.002615983719820114, "loss": 0.1492, "step": 10190 }, { "epoch": 0.26, "learning_rate": 0.002615606863804236, "loss": 0.1496, "step": 10200 }, { "epoch": 0.26, "learning_rate": 0.0026152300077883577, "loss": 0.1457, "step": 10210 }, { "epoch": 0.26, "learning_rate": 0.0026148531517724794, "loss": 0.1477, "step": 10220 }, { "epoch": 0.26, "learning_rate": 0.002614476295756601, "loss": 0.144, "step": 10230 }, { "epoch": 0.26, "learning_rate": 0.002614099439740723, "loss": 0.1474, "step": 10240 }, { "epoch": 0.26, "learning_rate": 0.0026137225837248447, "loss": 0.1468, "step": 10250 }, { "epoch": 0.26, "learning_rate": 0.002613345727708967, "loss": 0.1448, "step": 10260 }, { "epoch": 0.26, "learning_rate": 0.0026129688716930886, "loss": 0.1464, "step": 10270 }, { "epoch": 0.26, "learning_rate": 0.0026125920156772104, "loss": 0.143, "step": 10280 }, { "epoch": 0.26, "learning_rate": 0.002612215159661332, "loss": 0.1482, "step": 10290 }, { "epoch": 0.26, "learning_rate": 0.002611838303645454, "loss": 0.1453, "step": 10300 }, { "epoch": 0.26, "learning_rate": 0.002611461447629576, "loss": 0.1499, "step": 10310 }, { "epoch": 0.26, "learning_rate": 0.0026110845916136973, "loss": 0.1463, "step": 10320 }, { "epoch": 0.26, "learning_rate": 0.002610707735597819, "loss": 0.1485, "step": 10330 }, { "epoch": 0.26, "learning_rate": 0.0026103308795819413, "loss": 0.1493, "step": 10340 }, { "epoch": 0.26, "learning_rate": 0.002609954023566063, "loss": 0.1432, "step": 10350 }, { "epoch": 0.26, "learning_rate": 0.0026095771675501847, "loss": 0.1503, "step": 10360 }, { "epoch": 0.26, "learning_rate": 0.0026092003115343065, "loss": 0.1481, "step": 10370 }, { "epoch": 0.26, "learning_rate": 0.0026088234555184282, "loss": 0.1472, "step": 10380 }, { "epoch": 0.26, "learning_rate": 0.0026084465995025504, "loss": 0.1439, "step": 10390 }, { "epoch": 0.26, "learning_rate": 0.0026080697434866717, "loss": 0.1449, "step": 10400 }, { "epoch": 0.26, "learning_rate": 0.002607692887470794, "loss": 0.1412, "step": 10410 }, { "epoch": 0.26, "learning_rate": 0.0026073160314549156, "loss": 0.1421, "step": 10420 }, { "epoch": 0.26, "learning_rate": 0.0026069391754390374, "loss": 0.1427, "step": 10430 }, { "epoch": 0.26, "learning_rate": 0.002606562319423159, "loss": 0.1467, "step": 10440 }, { "epoch": 0.26, "learning_rate": 0.002606185463407281, "loss": 0.1415, "step": 10450 }, { "epoch": 0.26, "learning_rate": 0.0026058086073914026, "loss": 0.1461, "step": 10460 }, { "epoch": 0.26, "learning_rate": 0.0026054317513755244, "loss": 0.1455, "step": 10470 }, { "epoch": 0.26, "learning_rate": 0.002605054895359646, "loss": 0.1416, "step": 10480 }, { "epoch": 0.26, "learning_rate": 0.0026046780393437683, "loss": 0.1482, "step": 10490 }, { "epoch": 0.26, "learning_rate": 0.00260430118332789, "loss": 0.1445, "step": 10500 }, { "epoch": 0.26, "eval_cer": 0.667484758232287, "eval_loss": 0.11072567105293274, "eval_runtime": 90.1742, "eval_samples_per_second": 110.885, "eval_steps_per_second": 6.931, "step": 10500 }, { "epoch": 0.26, "learning_rate": 0.0026039243273120118, "loss": 0.1448, "step": 10510 }, { "epoch": 0.26, "learning_rate": 0.0026035474712961335, "loss": 0.1456, "step": 10520 }, { "epoch": 0.26, "learning_rate": 0.0026031706152802553, "loss": 0.1453, "step": 10530 }, { "epoch": 0.26, "learning_rate": 0.002602793759264377, "loss": 0.147, "step": 10540 }, { "epoch": 0.27, "learning_rate": 0.0026024169032484988, "loss": 0.1432, "step": 10550 }, { "epoch": 0.27, "learning_rate": 0.0026020400472326205, "loss": 0.1412, "step": 10560 }, { "epoch": 0.27, "learning_rate": 0.0026016631912167427, "loss": 0.143, "step": 10570 }, { "epoch": 0.27, "learning_rate": 0.0026012863352008644, "loss": 0.1455, "step": 10580 }, { "epoch": 0.27, "learning_rate": 0.002600909479184986, "loss": 0.1461, "step": 10590 }, { "epoch": 0.27, "learning_rate": 0.002600532623169108, "loss": 0.1469, "step": 10600 }, { "epoch": 0.27, "learning_rate": 0.0026001557671532297, "loss": 0.1434, "step": 10610 }, { "epoch": 0.27, "learning_rate": 0.002599778911137352, "loss": 0.1427, "step": 10620 }, { "epoch": 0.27, "learning_rate": 0.002599402055121473, "loss": 0.1433, "step": 10630 }, { "epoch": 0.27, "learning_rate": 0.002599025199105595, "loss": 0.1423, "step": 10640 }, { "epoch": 0.27, "learning_rate": 0.002598648343089717, "loss": 0.1437, "step": 10650 }, { "epoch": 0.27, "learning_rate": 0.002598271487073839, "loss": 0.1428, "step": 10660 }, { "epoch": 0.27, "learning_rate": 0.0025978946310579606, "loss": 0.1399, "step": 10670 }, { "epoch": 0.27, "learning_rate": 0.0025975177750420823, "loss": 0.1451, "step": 10680 }, { "epoch": 0.27, "learning_rate": 0.002597140919026204, "loss": 0.1415, "step": 10690 }, { "epoch": 0.27, "learning_rate": 0.002596764063010326, "loss": 0.1459, "step": 10700 }, { "epoch": 0.27, "learning_rate": 0.0025963872069944475, "loss": 0.1434, "step": 10710 }, { "epoch": 0.27, "learning_rate": 0.0025960103509785697, "loss": 0.1413, "step": 10720 }, { "epoch": 0.27, "learning_rate": 0.0025956334949626915, "loss": 0.1446, "step": 10730 }, { "epoch": 0.27, "learning_rate": 0.0025952566389468128, "loss": 0.1448, "step": 10740 }, { "epoch": 0.27, "learning_rate": 0.002594879782930935, "loss": 0.1407, "step": 10750 }, { "epoch": 0.27, "learning_rate": 0.0025945029269150567, "loss": 0.1408, "step": 10760 }, { "epoch": 0.27, "learning_rate": 0.0025941260708991784, "loss": 0.1419, "step": 10770 }, { "epoch": 0.27, "learning_rate": 0.0025937492148833, "loss": 0.1484, "step": 10780 }, { "epoch": 0.27, "learning_rate": 0.002593372358867422, "loss": 0.143, "step": 10790 }, { "epoch": 0.27, "learning_rate": 0.002592995502851544, "loss": 0.1421, "step": 10800 }, { "epoch": 0.27, "learning_rate": 0.002592618646835666, "loss": 0.1387, "step": 10810 }, { "epoch": 0.27, "learning_rate": 0.0025922417908197876, "loss": 0.1425, "step": 10820 }, { "epoch": 0.27, "learning_rate": 0.0025918649348039093, "loss": 0.1439, "step": 10830 }, { "epoch": 0.27, "learning_rate": 0.002591488078788031, "loss": 0.141, "step": 10840 }, { "epoch": 0.27, "learning_rate": 0.0025911112227721533, "loss": 0.1422, "step": 10850 }, { "epoch": 0.27, "learning_rate": 0.0025907343667562746, "loss": 0.1427, "step": 10860 }, { "epoch": 0.27, "learning_rate": 0.0025903575107403963, "loss": 0.1419, "step": 10870 }, { "epoch": 0.27, "learning_rate": 0.0025899806547245185, "loss": 0.1379, "step": 10880 }, { "epoch": 0.27, "learning_rate": 0.0025896037987086402, "loss": 0.1473, "step": 10890 }, { "epoch": 0.27, "learning_rate": 0.002589226942692762, "loss": 0.1432, "step": 10900 }, { "epoch": 0.27, "learning_rate": 0.0025888500866768837, "loss": 0.1424, "step": 10910 }, { "epoch": 0.27, "learning_rate": 0.0025884732306610055, "loss": 0.1451, "step": 10920 }, { "epoch": 0.27, "learning_rate": 0.0025880963746451272, "loss": 0.1381, "step": 10930 }, { "epoch": 0.27, "learning_rate": 0.002587719518629249, "loss": 0.1393, "step": 10940 }, { "epoch": 0.28, "learning_rate": 0.0025873426626133707, "loss": 0.141, "step": 10950 }, { "epoch": 0.28, "learning_rate": 0.002586965806597493, "loss": 0.1405, "step": 10960 }, { "epoch": 0.28, "learning_rate": 0.002586588950581614, "loss": 0.1392, "step": 10970 }, { "epoch": 0.28, "learning_rate": 0.0025862120945657364, "loss": 0.1428, "step": 10980 }, { "epoch": 0.28, "learning_rate": 0.002585835238549858, "loss": 0.1447, "step": 10990 }, { "epoch": 0.28, "learning_rate": 0.00258545838253398, "loss": 0.1378, "step": 11000 }, { "epoch": 0.28, "eval_cer": 0.6664130582813244, "eval_loss": 0.111346036195755, "eval_runtime": 90.4938, "eval_samples_per_second": 110.494, "eval_steps_per_second": 6.907, "step": 11000 }, { "epoch": 0.28, "learning_rate": 0.0025850815265181016, "loss": 0.1417, "step": 11010 }, { "epoch": 0.28, "learning_rate": 0.0025847046705022234, "loss": 0.1412, "step": 11020 }, { "epoch": 0.28, "learning_rate": 0.0025843278144863455, "loss": 0.1388, "step": 11030 }, { "epoch": 0.28, "learning_rate": 0.0025839509584704673, "loss": 0.1448, "step": 11040 }, { "epoch": 0.28, "learning_rate": 0.0025835741024545886, "loss": 0.1433, "step": 11050 }, { "epoch": 0.28, "learning_rate": 0.0025831972464387108, "loss": 0.1429, "step": 11060 }, { "epoch": 0.28, "learning_rate": 0.0025828203904228325, "loss": 0.1434, "step": 11070 }, { "epoch": 0.28, "learning_rate": 0.0025824435344069543, "loss": 0.1394, "step": 11080 }, { "epoch": 0.28, "learning_rate": 0.002582066678391076, "loss": 0.1412, "step": 11090 }, { "epoch": 0.28, "learning_rate": 0.0025816898223751977, "loss": 0.1464, "step": 11100 }, { "epoch": 0.28, "learning_rate": 0.00258131296635932, "loss": 0.1395, "step": 11110 }, { "epoch": 0.28, "learning_rate": 0.0025809361103434417, "loss": 0.1418, "step": 11120 }, { "epoch": 0.28, "learning_rate": 0.0025805592543275634, "loss": 0.1392, "step": 11130 }, { "epoch": 0.28, "learning_rate": 0.002580182398311685, "loss": 0.1393, "step": 11140 }, { "epoch": 0.28, "learning_rate": 0.002579805542295807, "loss": 0.1404, "step": 11150 }, { "epoch": 0.28, "learning_rate": 0.0025794286862799286, "loss": 5.9387, "step": 11160 }, { "epoch": 0.28, "learning_rate": 0.0025790518302640504, "loss": 7.2621, "step": 11170 }, { "epoch": 0.28, "learning_rate": 0.002578674974248172, "loss": 6.7929, "step": 11180 }, { "epoch": 0.28, "learning_rate": 0.0025782981182322943, "loss": 7.9889, "step": 11190 }, { "epoch": 0.28, "learning_rate": 0.0025779212622164156, "loss": 7.8188, "step": 11200 }, { "epoch": 0.28, "learning_rate": 0.002577544406200538, "loss": 7.1258, "step": 11210 }, { "epoch": 0.28, "learning_rate": 0.0025771675501846595, "loss": 6.8801, "step": 11220 }, { "epoch": 0.28, "learning_rate": 0.0025767906941687813, "loss": 6.7671, "step": 11230 }, { "epoch": 0.28, "learning_rate": 0.002576413838152903, "loss": 6.5726, "step": 11240 }, { "epoch": 0.28, "learning_rate": 0.002576036982137025, "loss": 6.2308, "step": 11250 }, { "epoch": 0.28, "learning_rate": 0.002575660126121147, "loss": 6.2539, "step": 11260 }, { "epoch": 0.28, "learning_rate": 0.0025752832701052687, "loss": 7.1063, "step": 11270 }, { "epoch": 0.28, "learning_rate": 0.00257490641408939, "loss": 6.5323, "step": 11280 }, { "epoch": 0.28, "learning_rate": 0.002574529558073512, "loss": 6.2713, "step": 11290 }, { "epoch": 0.28, "learning_rate": 0.002574152702057634, "loss": 6.0892, "step": 11300 }, { "epoch": 0.28, "learning_rate": 0.0025737758460417557, "loss": 6.2819, "step": 11310 }, { "epoch": 0.28, "learning_rate": 0.0025733989900258774, "loss": 6.2821, "step": 11320 }, { "epoch": 0.28, "learning_rate": 0.002573022134009999, "loss": 6.1237, "step": 11330 }, { "epoch": 0.28, "learning_rate": 0.0025726452779941214, "loss": 6.0933, "step": 11340 }, { "epoch": 0.29, "learning_rate": 0.0025722684219782427, "loss": 6.2318, "step": 11350 }, { "epoch": 0.29, "learning_rate": 0.0025718915659623644, "loss": 6.0266, "step": 11360 }, { "epoch": 0.29, "learning_rate": 0.0025715147099464866, "loss": 5.8218, "step": 11370 }, { "epoch": 0.29, "learning_rate": 0.0025711378539306083, "loss": 5.8923, "step": 11380 }, { "epoch": 0.29, "learning_rate": 0.00257076099791473, "loss": 5.8399, "step": 11390 }, { "epoch": 0.29, "learning_rate": 0.002570384141898852, "loss": 5.9417, "step": 11400 }, { "epoch": 0.29, "learning_rate": 0.0025700072858829736, "loss": 5.9609, "step": 11410 }, { "epoch": 0.29, "learning_rate": 0.0025696304298670957, "loss": 6.7493, "step": 11420 }, { "epoch": 0.29, "learning_rate": 0.002569253573851217, "loss": 6.8029, "step": 11430 }, { "epoch": 0.29, "learning_rate": 0.0025688767178353392, "loss": 6.3757, "step": 11440 }, { "epoch": 0.29, "learning_rate": 0.002568499861819461, "loss": 6.2486, "step": 11450 }, { "epoch": 0.29, "learning_rate": 0.0025681230058035827, "loss": 6.15, "step": 11460 }, { "epoch": 0.29, "learning_rate": 0.0025677461497877045, "loss": 6.1534, "step": 11470 }, { "epoch": 0.29, "learning_rate": 0.002567369293771826, "loss": 6.0945, "step": 11480 }, { "epoch": 0.29, "learning_rate": 0.002566992437755948, "loss": 6.1041, "step": 11490 }, { "epoch": 0.29, "learning_rate": 0.00256661558174007, "loss": 6.1099, "step": 11500 }, { "epoch": 0.29, "eval_cer": 0.8805047336221677, "eval_loss": 6.048417091369629, "eval_runtime": 90.456, "eval_samples_per_second": 110.54, "eval_steps_per_second": 6.909, "step": 11500 }, { "epoch": 0.29, "learning_rate": 0.0025662387257241914, "loss": 6.1748, "step": 11510 }, { "epoch": 0.29, "learning_rate": 0.0025658618697083136, "loss": 6.2297, "step": 11520 }, { "epoch": 0.29, "learning_rate": 0.0025654850136924354, "loss": 6.2931, "step": 11530 }, { "epoch": 0.29, "learning_rate": 0.002565108157676557, "loss": 6.3084, "step": 11540 }, { "epoch": 0.29, "learning_rate": 0.002564731301660679, "loss": 6.2893, "step": 11550 }, { "epoch": 0.29, "learning_rate": 0.0025643544456448006, "loss": 6.273, "step": 11560 }, { "epoch": 0.29, "learning_rate": 0.0025639775896289228, "loss": 6.2783, "step": 11570 }, { "epoch": 0.29, "learning_rate": 0.002563600733613044, "loss": 6.2444, "step": 11580 }, { "epoch": 0.29, "learning_rate": 0.002563223877597166, "loss": 6.2464, "step": 11590 }, { "epoch": 0.29, "learning_rate": 0.002562847021581288, "loss": 6.3133, "step": 11600 }, { "epoch": 0.29, "learning_rate": 0.0025624701655654098, "loss": 6.1791, "step": 11610 }, { "epoch": 0.29, "learning_rate": 0.0025620933095495315, "loss": 6.0017, "step": 11620 }, { "epoch": 0.29, "learning_rate": 0.0025617164535336532, "loss": 5.9354, "step": 11630 }, { "epoch": 0.29, "learning_rate": 0.002561339597517775, "loss": 5.9088, "step": 11640 }, { "epoch": 0.29, "learning_rate": 0.002560962741501897, "loss": 5.8717, "step": 11650 }, { "epoch": 0.29, "learning_rate": 0.0025605858854860185, "loss": 5.8255, "step": 11660 }, { "epoch": 0.29, "learning_rate": 0.0025602090294701407, "loss": 5.7379, "step": 11670 }, { "epoch": 0.29, "learning_rate": 0.0025598321734542624, "loss": 5.7158, "step": 11680 }, { "epoch": 0.29, "learning_rate": 0.002559455317438384, "loss": 5.667, "step": 11690 }, { "epoch": 0.29, "learning_rate": 0.002559078461422506, "loss": 5.62, "step": 11700 }, { "epoch": 0.29, "learning_rate": 0.0025587016054066276, "loss": 5.5561, "step": 11710 }, { "epoch": 0.29, "learning_rate": 0.0025583247493907494, "loss": 5.5272, "step": 11720 }, { "epoch": 0.29, "learning_rate": 0.0025579478933748716, "loss": 5.4919, "step": 11730 }, { "epoch": 0.29, "learning_rate": 0.002557571037358993, "loss": 5.4039, "step": 11740 }, { "epoch": 0.3, "learning_rate": 0.002557194181343115, "loss": 5.323, "step": 11750 }, { "epoch": 0.3, "learning_rate": 0.002556817325327237, "loss": 5.2373, "step": 11760 }, { "epoch": 0.3, "learning_rate": 0.0025564404693113585, "loss": 5.1487, "step": 11770 }, { "epoch": 0.3, "learning_rate": 0.0025560636132954803, "loss": 5.1224, "step": 11780 }, { "epoch": 0.3, "learning_rate": 0.002555686757279602, "loss": 5.408, "step": 11790 }, { "epoch": 0.3, "learning_rate": 0.0025553099012637238, "loss": 6.0158, "step": 11800 }, { "epoch": 0.3, "learning_rate": 0.0025549330452478455, "loss": 6.0681, "step": 11810 }, { "epoch": 0.3, "learning_rate": 0.0025545561892319673, "loss": 5.6654, "step": 11820 }, { "epoch": 0.3, "learning_rate": 0.0025541793332160894, "loss": 5.3601, "step": 11830 }, { "epoch": 0.3, "learning_rate": 0.002553802477200211, "loss": 5.2609, "step": 11840 }, { "epoch": 0.3, "learning_rate": 0.002553425621184333, "loss": 5.2451, "step": 11850 }, { "epoch": 0.3, "learning_rate": 0.0025530487651684547, "loss": 5.208, "step": 11860 }, { "epoch": 0.3, "learning_rate": 0.0025526719091525764, "loss": 5.1566, "step": 11870 }, { "epoch": 0.3, "learning_rate": 0.0025522950531366986, "loss": 5.8534, "step": 11880 }, { "epoch": 0.3, "learning_rate": 0.00255191819712082, "loss": 6.3235, "step": 11890 }, { "epoch": 0.3, "learning_rate": 0.0025515413411049417, "loss": 6.0392, "step": 11900 }, { "epoch": 0.3, "learning_rate": 0.002551164485089064, "loss": 5.5035, "step": 11910 }, { "epoch": 0.3, "learning_rate": 0.0025507876290731856, "loss": 5.1853, "step": 11920 }, { "epoch": 0.3, "learning_rate": 0.0025504107730573073, "loss": 5.0908, "step": 11930 }, { "epoch": 0.3, "learning_rate": 0.002550033917041429, "loss": 5.0612, "step": 11940 }, { "epoch": 0.3, "learning_rate": 0.002549657061025551, "loss": 5.1003, "step": 11950 }, { "epoch": 0.3, "learning_rate": 0.002549280205009673, "loss": 5.0377, "step": 11960 }, { "epoch": 0.3, "learning_rate": 0.0025489033489937943, "loss": 4.9801, "step": 11970 }, { "epoch": 0.3, "learning_rate": 0.0025485264929779165, "loss": 4.9317, "step": 11980 }, { "epoch": 0.3, "learning_rate": 0.0025481496369620382, "loss": 4.9793, "step": 11990 }, { "epoch": 0.3, "learning_rate": 0.00254777278094616, "loss": 4.9528, "step": 12000 }, { "epoch": 0.3, "eval_cer": 0.811528065112389, "eval_loss": 4.661426067352295, "eval_runtime": 90.744, "eval_samples_per_second": 110.189, "eval_steps_per_second": 6.888, "step": 12000 }, { "epoch": 0.3, "learning_rate": 0.0025473959249302817, "loss": 4.9223, "step": 12010 }, { "epoch": 0.3, "learning_rate": 0.0025470190689144035, "loss": 4.8947, "step": 12020 }, { "epoch": 0.3, "learning_rate": 0.002546642212898525, "loss": 4.8087, "step": 12030 }, { "epoch": 0.3, "learning_rate": 0.002546265356882647, "loss": 4.786, "step": 12040 }, { "epoch": 0.3, "learning_rate": 0.0025458885008667687, "loss": 4.7338, "step": 12050 }, { "epoch": 0.3, "learning_rate": 0.002545511644850891, "loss": 4.7176, "step": 12060 }, { "epoch": 0.3, "learning_rate": 0.0025451347888350126, "loss": 4.7573, "step": 12070 }, { "epoch": 0.3, "learning_rate": 0.0025447579328191344, "loss": 4.7873, "step": 12080 }, { "epoch": 0.3, "learning_rate": 0.002544381076803256, "loss": 4.7283, "step": 12090 }, { "epoch": 0.3, "learning_rate": 0.002544004220787378, "loss": 4.674, "step": 12100 }, { "epoch": 0.3, "learning_rate": 0.0025436273647714996, "loss": 4.7024, "step": 12110 }, { "epoch": 0.3, "learning_rate": 0.0025432505087556213, "loss": 4.7434, "step": 12120 }, { "epoch": 0.3, "learning_rate": 0.002542873652739743, "loss": 4.6647, "step": 12130 }, { "epoch": 0.3, "learning_rate": 0.0025424967967238653, "loss": 4.6216, "step": 12140 }, { "epoch": 0.31, "learning_rate": 0.002542119940707987, "loss": 4.636, "step": 12150 }, { "epoch": 0.31, "learning_rate": 0.0025417430846921087, "loss": 4.6511, "step": 12160 }, { "epoch": 0.31, "learning_rate": 0.0025413662286762305, "loss": 4.5795, "step": 12170 }, { "epoch": 0.31, "learning_rate": 0.0025409893726603522, "loss": 4.4972, "step": 12180 }, { "epoch": 0.31, "learning_rate": 0.0025406125166444744, "loss": 4.435, "step": 12190 }, { "epoch": 0.31, "learning_rate": 0.0025402356606285957, "loss": 4.379, "step": 12200 }, { "epoch": 0.31, "learning_rate": 0.0025398588046127175, "loss": 4.3485, "step": 12210 }, { "epoch": 0.31, "learning_rate": 0.0025394819485968396, "loss": 4.2845, "step": 12220 }, { "epoch": 0.31, "learning_rate": 0.0025391050925809614, "loss": 4.1975, "step": 12230 }, { "epoch": 0.31, "learning_rate": 0.002538728236565083, "loss": 3.0927, "step": 12240 }, { "epoch": 0.31, "learning_rate": 0.002538351380549205, "loss": 1.1231, "step": 12250 }, { "epoch": 0.31, "learning_rate": 0.0025379745245333266, "loss": 0.566, "step": 12260 }, { "epoch": 0.31, "learning_rate": 0.0025375976685174484, "loss": 0.4869, "step": 12270 }, { "epoch": 0.31, "learning_rate": 0.00253722081250157, "loss": 0.4279, "step": 12280 }, { "epoch": 0.31, "learning_rate": 0.0025368439564856923, "loss": 0.4044, "step": 12290 }, { "epoch": 0.31, "learning_rate": 0.002536467100469814, "loss": 0.3643, "step": 12300 }, { "epoch": 0.31, "learning_rate": 0.0025360902444539354, "loss": 0.4048, "step": 12310 }, { "epoch": 0.31, "learning_rate": 0.0025357133884380575, "loss": 0.3471, "step": 12320 }, { "epoch": 0.31, "learning_rate": 0.0025353365324221793, "loss": 0.3162, "step": 12330 }, { "epoch": 0.31, "learning_rate": 0.002534959676406301, "loss": 0.2862, "step": 12340 }, { "epoch": 0.31, "learning_rate": 0.0025345828203904228, "loss": 0.2789, "step": 12350 }, { "epoch": 0.31, "learning_rate": 0.0025342059643745445, "loss": 0.2707, "step": 12360 }, { "epoch": 0.31, "learning_rate": 0.0025338291083586667, "loss": 0.255, "step": 12370 }, { "epoch": 0.31, "learning_rate": 0.0025334522523427884, "loss": 0.2596, "step": 12380 }, { "epoch": 0.31, "learning_rate": 0.00253307539632691, "loss": 0.2378, "step": 12390 }, { "epoch": 0.31, "learning_rate": 0.002532698540311032, "loss": 0.2396, "step": 12400 }, { "epoch": 0.31, "learning_rate": 0.0025323216842951537, "loss": 0.2339, "step": 12410 }, { "epoch": 0.31, "learning_rate": 0.002531944828279276, "loss": 0.2316, "step": 12420 }, { "epoch": 0.31, "learning_rate": 0.002531567972263397, "loss": 0.2366, "step": 12430 }, { "epoch": 0.31, "learning_rate": 0.002531191116247519, "loss": 0.2309, "step": 12440 }, { "epoch": 0.31, "learning_rate": 0.002530814260231641, "loss": 0.2239, "step": 12450 }, { "epoch": 0.31, "learning_rate": 0.0025304374042157624, "loss": 0.2195, "step": 12460 }, { "epoch": 0.31, "learning_rate": 0.0025300605481998846, "loss": 0.2191, "step": 12470 }, { "epoch": 0.31, "learning_rate": 0.0025296836921840063, "loss": 0.2128, "step": 12480 }, { "epoch": 0.31, "learning_rate": 0.002529306836168128, "loss": 0.209, "step": 12490 }, { "epoch": 0.31, "learning_rate": 0.00252892998015225, "loss": 0.2066, "step": 12500 }, { "epoch": 0.31, "eval_cer": 0.6679375959753745, "eval_loss": 0.14948998391628265, "eval_runtime": 90.7588, "eval_samples_per_second": 110.171, "eval_steps_per_second": 6.886, "step": 12500 }, { "epoch": 0.31, "learning_rate": 0.0025285531241363715, "loss": 0.2081, "step": 12510 }, { "epoch": 0.31, "learning_rate": 0.0025281762681204933, "loss": 0.2056, "step": 12520 }, { "epoch": 0.31, "learning_rate": 0.0025277994121046155, "loss": 0.2009, "step": 12530 }, { "epoch": 0.32, "learning_rate": 0.0025274225560887368, "loss": 0.1993, "step": 12540 }, { "epoch": 0.32, "learning_rate": 0.002527045700072859, "loss": 0.1974, "step": 12550 }, { "epoch": 0.32, "learning_rate": 0.0025266688440569807, "loss": 0.1969, "step": 12560 }, { "epoch": 0.32, "learning_rate": 0.0025262919880411024, "loss": 0.1976, "step": 12570 }, { "epoch": 0.32, "learning_rate": 0.002525915132025224, "loss": 0.1909, "step": 12580 }, { "epoch": 0.32, "learning_rate": 0.002525538276009346, "loss": 0.1953, "step": 12590 }, { "epoch": 0.32, "learning_rate": 0.002525161419993468, "loss": 0.1904, "step": 12600 }, { "epoch": 0.32, "learning_rate": 0.00252478456397759, "loss": 0.1923, "step": 12610 }, { "epoch": 0.32, "learning_rate": 0.002524407707961711, "loss": 0.1899, "step": 12620 }, { "epoch": 0.32, "learning_rate": 0.0025240308519458333, "loss": 0.1873, "step": 12630 }, { "epoch": 0.32, "learning_rate": 0.002523653995929955, "loss": 0.1892, "step": 12640 }, { "epoch": 0.32, "learning_rate": 0.002523277139914077, "loss": 0.1862, "step": 12650 }, { "epoch": 0.32, "learning_rate": 0.0025229002838981986, "loss": 0.186, "step": 12660 }, { "epoch": 0.32, "learning_rate": 0.0025225234278823203, "loss": 0.182, "step": 12670 }, { "epoch": 0.32, "learning_rate": 0.0025221465718664425, "loss": 0.1819, "step": 12680 }, { "epoch": 0.32, "learning_rate": 0.002521769715850564, "loss": 0.1777, "step": 12690 }, { "epoch": 0.32, "learning_rate": 0.002521392859834686, "loss": 0.1781, "step": 12700 }, { "epoch": 0.32, "learning_rate": 0.0025210160038188077, "loss": 0.1827, "step": 12710 }, { "epoch": 0.32, "learning_rate": 0.0025206391478029295, "loss": 0.1773, "step": 12720 }, { "epoch": 0.32, "learning_rate": 0.0025202622917870512, "loss": 0.1813, "step": 12730 }, { "epoch": 0.32, "learning_rate": 0.002519885435771173, "loss": 0.1815, "step": 12740 }, { "epoch": 0.32, "learning_rate": 0.0025195085797552947, "loss": 0.1758, "step": 12750 }, { "epoch": 0.32, "learning_rate": 0.002519131723739417, "loss": 0.1794, "step": 12760 }, { "epoch": 0.32, "learning_rate": 0.002518754867723538, "loss": 0.1755, "step": 12770 }, { "epoch": 0.32, "learning_rate": 0.0025183780117076604, "loss": 0.1786, "step": 12780 }, { "epoch": 0.32, "learning_rate": 0.002518001155691782, "loss": 0.1749, "step": 12790 }, { "epoch": 0.32, "learning_rate": 0.002517624299675904, "loss": 0.174, "step": 12800 }, { "epoch": 0.32, "learning_rate": 0.0025172474436600256, "loss": 0.1782, "step": 12810 }, { "epoch": 0.32, "learning_rate": 0.0025168705876441474, "loss": 0.1763, "step": 12820 }, { "epoch": 0.32, "learning_rate": 0.0025164937316282695, "loss": 0.1749, "step": 12830 }, { "epoch": 0.32, "learning_rate": 0.0025161168756123913, "loss": 0.1728, "step": 12840 }, { "epoch": 0.32, "learning_rate": 0.0025157400195965126, "loss": 0.17, "step": 12850 }, { "epoch": 0.32, "learning_rate": 0.0025153631635806348, "loss": 0.1732, "step": 12860 }, { "epoch": 0.32, "learning_rate": 0.0025149863075647565, "loss": 0.1685, "step": 12870 }, { "epoch": 0.32, "learning_rate": 0.0025146094515488783, "loss": 0.1734, "step": 12880 }, { "epoch": 0.32, "learning_rate": 0.002514232595533, "loss": 0.1757, "step": 12890 }, { "epoch": 0.32, "learning_rate": 0.0025138557395171218, "loss": 0.1672, "step": 12900 }, { "epoch": 0.32, "learning_rate": 0.002513478883501244, "loss": 0.1718, "step": 12910 }, { "epoch": 0.32, "learning_rate": 0.0025131020274853652, "loss": 0.1732, "step": 12920 }, { "epoch": 0.32, "learning_rate": 0.002512725171469487, "loss": 0.1701, "step": 12930 }, { "epoch": 0.33, "learning_rate": 0.002512348315453609, "loss": 0.1653, "step": 12940 }, { "epoch": 0.33, "learning_rate": 0.002511971459437731, "loss": 0.1674, "step": 12950 }, { "epoch": 0.33, "learning_rate": 0.0025115946034218527, "loss": 0.1712, "step": 12960 }, { "epoch": 0.33, "learning_rate": 0.0025112177474059744, "loss": 0.1643, "step": 12970 }, { "epoch": 0.33, "learning_rate": 0.002510840891390096, "loss": 0.1636, "step": 12980 }, { "epoch": 0.33, "learning_rate": 0.0025104640353742183, "loss": 0.1633, "step": 12990 }, { "epoch": 0.33, "learning_rate": 0.0025100871793583396, "loss": 0.1654, "step": 13000 }, { "epoch": 0.33, "eval_cer": 0.6678427935998291, "eval_loss": 0.12283774465322495, "eval_runtime": 90.4365, "eval_samples_per_second": 110.564, "eval_steps_per_second": 6.911, "step": 13000 }, { "epoch": 0.33, "learning_rate": 0.002509710323342462, "loss": 0.169, "step": 13010 }, { "epoch": 0.33, "learning_rate": 0.0025093334673265836, "loss": 0.1637, "step": 13020 }, { "epoch": 0.33, "learning_rate": 0.0025089566113107053, "loss": 0.1614, "step": 13030 }, { "epoch": 0.33, "learning_rate": 0.002508579755294827, "loss": 0.1662, "step": 13040 }, { "epoch": 0.33, "learning_rate": 0.002508202899278949, "loss": 0.165, "step": 13050 }, { "epoch": 0.33, "learning_rate": 0.0025078260432630705, "loss": 0.1591, "step": 13060 }, { "epoch": 0.33, "learning_rate": 0.0025074491872471927, "loss": 0.1631, "step": 13070 }, { "epoch": 0.33, "learning_rate": 0.002507072331231314, "loss": 0.1596, "step": 13080 }, { "epoch": 0.33, "learning_rate": 0.002506695475215436, "loss": 0.1599, "step": 13090 }, { "epoch": 0.33, "learning_rate": 0.002506318619199558, "loss": 0.158, "step": 13100 }, { "epoch": 0.33, "learning_rate": 0.0025059417631836797, "loss": 0.1625, "step": 13110 }, { "epoch": 0.33, "learning_rate": 0.0025055649071678014, "loss": 0.1618, "step": 13120 }, { "epoch": 0.33, "learning_rate": 0.002505188051151923, "loss": 0.1655, "step": 13130 }, { "epoch": 0.33, "learning_rate": 0.0025048111951360454, "loss": 0.1585, "step": 13140 }, { "epoch": 0.33, "learning_rate": 0.0025044343391201667, "loss": 0.1597, "step": 13150 }, { "epoch": 0.33, "learning_rate": 0.0025040574831042884, "loss": 0.1604, "step": 13160 }, { "epoch": 0.33, "learning_rate": 0.0025036806270884106, "loss": 0.1563, "step": 13170 }, { "epoch": 0.33, "learning_rate": 0.0025033037710725323, "loss": 0.1571, "step": 13180 }, { "epoch": 0.33, "learning_rate": 0.002502926915056654, "loss": 0.1604, "step": 13190 }, { "epoch": 0.33, "learning_rate": 0.002502550059040776, "loss": 0.1669, "step": 13200 }, { "epoch": 0.33, "learning_rate": 0.0025021732030248976, "loss": 0.1606, "step": 13210 }, { "epoch": 0.33, "learning_rate": 0.0025017963470090198, "loss": 0.149, "step": 13220 }, { "epoch": 0.33, "learning_rate": 0.002501419490993141, "loss": 0.1592, "step": 13230 }, { "epoch": 0.33, "learning_rate": 0.0025010426349772632, "loss": 0.158, "step": 13240 }, { "epoch": 0.33, "learning_rate": 0.002500665778961385, "loss": 0.1601, "step": 13250 }, { "epoch": 0.33, "learning_rate": 0.0025002889229455067, "loss": 0.1525, "step": 13260 }, { "epoch": 0.33, "learning_rate": 0.0024999120669296285, "loss": 0.1606, "step": 13270 }, { "epoch": 0.33, "learning_rate": 0.0024995352109137502, "loss": 0.158, "step": 13280 }, { "epoch": 0.33, "learning_rate": 0.002499158354897872, "loss": 0.1574, "step": 13290 }, { "epoch": 0.33, "learning_rate": 0.002498781498881994, "loss": 0.1546, "step": 13300 }, { "epoch": 0.33, "learning_rate": 0.0024984046428661155, "loss": 0.1562, "step": 13310 }, { "epoch": 0.33, "learning_rate": 0.0024980277868502376, "loss": 0.1603, "step": 13320 }, { "epoch": 0.33, "learning_rate": 0.0024976509308343594, "loss": 0.1553, "step": 13330 }, { "epoch": 0.34, "learning_rate": 0.002497274074818481, "loss": 0.1568, "step": 13340 }, { "epoch": 0.34, "learning_rate": 0.002496897218802603, "loss": 0.1523, "step": 13350 }, { "epoch": 0.34, "learning_rate": 0.0024965203627867246, "loss": 0.1544, "step": 13360 }, { "epoch": 0.34, "learning_rate": 0.0024961435067708464, "loss": 0.1539, "step": 13370 }, { "epoch": 0.34, "learning_rate": 0.002495766650754968, "loss": 0.1557, "step": 13380 }, { "epoch": 0.34, "learning_rate": 0.00249538979473909, "loss": 0.1526, "step": 13390 }, { "epoch": 0.34, "learning_rate": 0.002495012938723212, "loss": 0.1537, "step": 13400 }, { "epoch": 0.34, "learning_rate": 0.0024946360827073338, "loss": 0.1574, "step": 13410 }, { "epoch": 0.34, "learning_rate": 0.0024942592266914555, "loss": 0.1555, "step": 13420 }, { "epoch": 0.34, "learning_rate": 0.0024938823706755773, "loss": 0.1528, "step": 13430 }, { "epoch": 0.34, "learning_rate": 0.002493505514659699, "loss": 0.1517, "step": 13440 }, { "epoch": 0.34, "learning_rate": 0.002493128658643821, "loss": 0.1604, "step": 13450 }, { "epoch": 0.34, "learning_rate": 0.0024927518026279425, "loss": 0.1541, "step": 13460 }, { "epoch": 0.34, "learning_rate": 0.0024923749466120642, "loss": 0.1515, "step": 13470 }, { "epoch": 0.34, "learning_rate": 0.0024919980905961864, "loss": 0.1506, "step": 13480 }, { "epoch": 0.34, "learning_rate": 0.002491621234580308, "loss": 0.1542, "step": 13490 }, { "epoch": 0.34, "learning_rate": 0.00249124437856443, "loss": 0.1552, "step": 13500 }, { "epoch": 0.34, "eval_cer": 0.667002084208571, "eval_loss": 0.11529998481273651, "eval_runtime": 90.608, "eval_samples_per_second": 110.355, "eval_steps_per_second": 6.898, "step": 13500 }, { "epoch": 0.34, "learning_rate": 0.0024908675225485516, "loss": 0.1555, "step": 13510 }, { "epoch": 0.34, "learning_rate": 0.0024904906665326734, "loss": 0.1503, "step": 13520 }, { "epoch": 0.34, "learning_rate": 0.0024901138105167956, "loss": 0.15, "step": 13530 }, { "epoch": 0.34, "learning_rate": 0.002489736954500917, "loss": 0.1545, "step": 13540 }, { "epoch": 0.34, "learning_rate": 0.002489360098485039, "loss": 0.1517, "step": 13550 }, { "epoch": 0.34, "learning_rate": 0.002488983242469161, "loss": 0.148, "step": 13560 }, { "epoch": 0.34, "learning_rate": 0.0024886063864532825, "loss": 0.1488, "step": 13570 }, { "epoch": 0.34, "learning_rate": 0.0024882295304374043, "loss": 0.1557, "step": 13580 }, { "epoch": 0.34, "learning_rate": 0.002487852674421526, "loss": 0.1546, "step": 13590 }, { "epoch": 0.34, "learning_rate": 0.0024874758184056478, "loss": 0.1531, "step": 13600 }, { "epoch": 0.34, "learning_rate": 0.0024870989623897695, "loss": 0.1531, "step": 13610 }, { "epoch": 0.34, "learning_rate": 0.0024867221063738913, "loss": 0.1513, "step": 13620 }, { "epoch": 0.34, "learning_rate": 0.0024863452503580134, "loss": 0.1519, "step": 13630 }, { "epoch": 0.34, "learning_rate": 0.002485968394342135, "loss": 0.1476, "step": 13640 }, { "epoch": 0.34, "learning_rate": 0.002485591538326257, "loss": 0.1527, "step": 13650 }, { "epoch": 0.34, "learning_rate": 0.0024852146823103787, "loss": 0.1544, "step": 13660 }, { "epoch": 0.34, "learning_rate": 0.0024848378262945004, "loss": 0.1496, "step": 13670 }, { "epoch": 0.34, "learning_rate": 0.0024844609702786226, "loss": 0.1513, "step": 13680 }, { "epoch": 0.34, "learning_rate": 0.002484084114262744, "loss": 0.1478, "step": 13690 }, { "epoch": 0.34, "learning_rate": 0.0024837072582468657, "loss": 0.1447, "step": 13700 }, { "epoch": 0.34, "learning_rate": 0.002483330402230988, "loss": 0.1524, "step": 13710 }, { "epoch": 0.34, "learning_rate": 0.0024829535462151096, "loss": 0.1535, "step": 13720 }, { "epoch": 0.34, "learning_rate": 0.0024825766901992313, "loss": 0.1486, "step": 13730 }, { "epoch": 0.35, "learning_rate": 0.002482199834183353, "loss": 0.1468, "step": 13740 }, { "epoch": 0.35, "learning_rate": 0.002481822978167475, "loss": 0.1505, "step": 13750 }, { "epoch": 0.35, "learning_rate": 0.002481446122151597, "loss": 0.1439, "step": 13760 }, { "epoch": 0.35, "learning_rate": 0.0024810692661357183, "loss": 0.1498, "step": 13770 }, { "epoch": 0.35, "learning_rate": 0.00248069241011984, "loss": 0.1507, "step": 13780 }, { "epoch": 0.35, "learning_rate": 0.0024803155541039622, "loss": 0.1455, "step": 13790 }, { "epoch": 0.35, "learning_rate": 0.0024799386980880835, "loss": 0.1438, "step": 13800 }, { "epoch": 0.35, "learning_rate": 0.0024795618420722057, "loss": 0.1513, "step": 13810 }, { "epoch": 0.35, "learning_rate": 0.0024791849860563275, "loss": 0.1477, "step": 13820 }, { "epoch": 0.35, "learning_rate": 0.002478808130040449, "loss": 0.1495, "step": 13830 }, { "epoch": 0.35, "learning_rate": 0.002478431274024571, "loss": 0.1464, "step": 13840 }, { "epoch": 0.35, "learning_rate": 0.0024780544180086927, "loss": 0.1432, "step": 13850 }, { "epoch": 0.35, "learning_rate": 0.002477677561992815, "loss": 0.1406, "step": 13860 }, { "epoch": 0.35, "learning_rate": 0.0024773007059769366, "loss": 0.1507, "step": 13870 }, { "epoch": 0.35, "learning_rate": 0.002476923849961058, "loss": 0.1433, "step": 13880 }, { "epoch": 0.35, "learning_rate": 0.00247654699394518, "loss": 0.1418, "step": 13890 }, { "epoch": 0.35, "learning_rate": 0.002476170137929302, "loss": 0.1437, "step": 13900 }, { "epoch": 0.35, "learning_rate": 0.0024757932819134236, "loss": 0.1461, "step": 13910 }, { "epoch": 0.35, "learning_rate": 0.0024754164258975453, "loss": 0.1473, "step": 13920 }, { "epoch": 0.35, "learning_rate": 0.002475039569881667, "loss": 0.1397, "step": 13930 }, { "epoch": 0.35, "learning_rate": 0.0024746627138657893, "loss": 0.1499, "step": 13940 }, { "epoch": 0.35, "learning_rate": 0.002474285857849911, "loss": 0.1454, "step": 13950 }, { "epoch": 0.35, "learning_rate": 0.0024739090018340328, "loss": 0.1452, "step": 13960 }, { "epoch": 0.35, "learning_rate": 0.0024735321458181545, "loss": 0.142, "step": 13970 }, { "epoch": 0.35, "learning_rate": 0.0024731552898022762, "loss": 0.1377, "step": 13980 }, { "epoch": 0.35, "learning_rate": 0.0024727784337863984, "loss": 0.1454, "step": 13990 }, { "epoch": 0.35, "learning_rate": 0.0024724015777705197, "loss": 0.1443, "step": 14000 }, { "epoch": 0.35, "eval_cer": 0.6669525174843011, "eval_loss": 0.11095242947340012, "eval_runtime": 90.4686, "eval_samples_per_second": 110.525, "eval_steps_per_second": 6.908, "step": 14000 }, { "epoch": 0.35, "learning_rate": 0.0024720247217546415, "loss": 0.1419, "step": 14010 }, { "epoch": 0.35, "learning_rate": 0.0024716478657387637, "loss": 0.1433, "step": 14020 }, { "epoch": 0.35, "learning_rate": 0.002471271009722885, "loss": 0.1403, "step": 14030 }, { "epoch": 0.35, "learning_rate": 0.002470894153707007, "loss": 0.1411, "step": 14040 }, { "epoch": 0.35, "learning_rate": 0.002470517297691129, "loss": 0.1438, "step": 14050 }, { "epoch": 0.35, "learning_rate": 0.0024701404416752506, "loss": 0.1491, "step": 14060 }, { "epoch": 0.35, "learning_rate": 0.0024697635856593724, "loss": 0.144, "step": 14070 }, { "epoch": 0.35, "learning_rate": 0.002469386729643494, "loss": 0.1426, "step": 14080 }, { "epoch": 0.35, "learning_rate": 0.0024690098736276163, "loss": 0.1418, "step": 14090 }, { "epoch": 0.35, "learning_rate": 0.002468633017611738, "loss": 0.1408, "step": 14100 }, { "epoch": 0.35, "learning_rate": 0.0024682561615958594, "loss": 0.146, "step": 14110 }, { "epoch": 0.35, "learning_rate": 0.0024678793055799815, "loss": 0.1426, "step": 14120 }, { "epoch": 0.35, "learning_rate": 0.0024675024495641033, "loss": 0.145, "step": 14130 }, { "epoch": 0.36, "learning_rate": 0.002467125593548225, "loss": 0.139, "step": 14140 }, { "epoch": 0.36, "learning_rate": 0.0024667487375323468, "loss": 0.1381, "step": 14150 }, { "epoch": 0.36, "learning_rate": 0.0024663718815164685, "loss": 0.1424, "step": 14160 }, { "epoch": 0.36, "learning_rate": 0.0024659950255005907, "loss": 0.1467, "step": 14170 }, { "epoch": 0.36, "learning_rate": 0.0024656181694847124, "loss": 0.1428, "step": 14180 }, { "epoch": 0.36, "learning_rate": 0.0024652413134688337, "loss": 0.1394, "step": 14190 }, { "epoch": 0.36, "learning_rate": 0.002464864457452956, "loss": 0.1443, "step": 14200 }, { "epoch": 0.36, "learning_rate": 0.0024644876014370777, "loss": 0.1398, "step": 14210 }, { "epoch": 0.36, "learning_rate": 0.0024641107454211994, "loss": 0.1463, "step": 14220 }, { "epoch": 0.36, "learning_rate": 0.002463733889405321, "loss": 0.1442, "step": 14230 }, { "epoch": 0.36, "learning_rate": 0.002463357033389443, "loss": 0.1421, "step": 14240 }, { "epoch": 0.36, "learning_rate": 0.002462980177373565, "loss": 0.1414, "step": 14250 }, { "epoch": 0.36, "learning_rate": 0.0024626033213576864, "loss": 0.1437, "step": 14260 }, { "epoch": 0.36, "learning_rate": 0.0024622264653418086, "loss": 0.1367, "step": 14270 }, { "epoch": 0.36, "learning_rate": 0.0024618496093259303, "loss": 0.1422, "step": 14280 }, { "epoch": 0.36, "learning_rate": 0.002461472753310052, "loss": 0.1452, "step": 14290 }, { "epoch": 0.36, "learning_rate": 0.002461095897294174, "loss": 0.1448, "step": 14300 }, { "epoch": 0.36, "learning_rate": 0.0024607190412782956, "loss": 0.1426, "step": 14310 }, { "epoch": 0.36, "learning_rate": 0.0024603421852624173, "loss": 0.138, "step": 14320 }, { "epoch": 0.36, "learning_rate": 0.0024599653292465395, "loss": 0.1415, "step": 14330 }, { "epoch": 0.36, "learning_rate": 0.002459588473230661, "loss": 0.1401, "step": 14340 }, { "epoch": 0.36, "learning_rate": 0.002459211617214783, "loss": 0.1424, "step": 14350 }, { "epoch": 0.36, "learning_rate": 0.0024588347611989047, "loss": 0.1391, "step": 14360 }, { "epoch": 0.36, "learning_rate": 0.0024584579051830265, "loss": 0.1413, "step": 14370 }, { "epoch": 0.36, "learning_rate": 0.002458081049167148, "loss": 0.139, "step": 14380 }, { "epoch": 0.36, "learning_rate": 0.00245770419315127, "loss": 0.1355, "step": 14390 }, { "epoch": 0.36, "learning_rate": 0.002457327337135392, "loss": 0.1426, "step": 14400 }, { "epoch": 0.36, "learning_rate": 0.002456950481119514, "loss": 0.1404, "step": 14410 }, { "epoch": 0.36, "learning_rate": 0.002456573625103635, "loss": 0.1383, "step": 14420 }, { "epoch": 0.36, "learning_rate": 0.0024561967690877574, "loss": 0.1378, "step": 14430 }, { "epoch": 0.36, "learning_rate": 0.002455819913071879, "loss": 0.1444, "step": 14440 }, { "epoch": 0.36, "learning_rate": 0.002455443057056001, "loss": 0.1368, "step": 14450 }, { "epoch": 0.36, "learning_rate": 0.0024550662010401226, "loss": 0.1395, "step": 14460 }, { "epoch": 0.36, "learning_rate": 0.0024546893450242443, "loss": 0.1366, "step": 14470 }, { "epoch": 0.36, "learning_rate": 0.0024543124890083665, "loss": 0.141, "step": 14480 }, { "epoch": 0.36, "learning_rate": 0.002453935632992488, "loss": 0.1415, "step": 14490 }, { "epoch": 0.36, "learning_rate": 0.00245355877697661, "loss": 0.1397, "step": 14500 }, { "epoch": 0.36, "eval_cer": 0.6669780226919351, "eval_loss": 0.10726305842399597, "eval_runtime": 90.529, "eval_samples_per_second": 110.451, "eval_steps_per_second": 6.904, "step": 14500 }, { "epoch": 0.36, "learning_rate": 0.0024531819209607317, "loss": 0.1349, "step": 14510 }, { "epoch": 0.36, "learning_rate": 0.0024528050649448535, "loss": 0.1399, "step": 14520 }, { "epoch": 0.37, "learning_rate": 0.0024524282089289752, "loss": 0.1368, "step": 14530 }, { "epoch": 0.37, "learning_rate": 0.002452051352913097, "loss": 0.1397, "step": 14540 }, { "epoch": 0.37, "learning_rate": 0.0024516744968972187, "loss": 0.1375, "step": 14550 }, { "epoch": 0.37, "learning_rate": 0.002451297640881341, "loss": 0.1395, "step": 14560 }, { "epoch": 0.37, "learning_rate": 0.002450920784865462, "loss": 0.1377, "step": 14570 }, { "epoch": 0.37, "learning_rate": 0.0024505439288495844, "loss": 0.1421, "step": 14580 }, { "epoch": 0.37, "learning_rate": 0.002450167072833706, "loss": 0.1413, "step": 14590 }, { "epoch": 0.37, "learning_rate": 0.002449790216817828, "loss": 0.1373, "step": 14600 }, { "epoch": 0.37, "learning_rate": 0.0024494133608019496, "loss": 0.137, "step": 14610 }, { "epoch": 0.37, "learning_rate": 0.0024490365047860714, "loss": 0.1361, "step": 14620 }, { "epoch": 0.37, "learning_rate": 0.002448659648770193, "loss": 0.1446, "step": 14630 }, { "epoch": 0.37, "learning_rate": 0.0024482827927543153, "loss": 0.1364, "step": 14640 }, { "epoch": 0.37, "learning_rate": 0.0024479059367384366, "loss": 0.141, "step": 14650 }, { "epoch": 0.37, "learning_rate": 0.0024475290807225588, "loss": 0.1425, "step": 14660 }, { "epoch": 0.37, "learning_rate": 0.0024471522247066805, "loss": 0.1365, "step": 14670 }, { "epoch": 0.37, "learning_rate": 0.0024467753686908023, "loss": 0.1399, "step": 14680 }, { "epoch": 0.37, "learning_rate": 0.002446398512674924, "loss": 0.1381, "step": 14690 }, { "epoch": 0.37, "learning_rate": 0.0024460216566590458, "loss": 0.1452, "step": 14700 }, { "epoch": 0.37, "learning_rate": 0.002445644800643168, "loss": 0.1399, "step": 14710 }, { "epoch": 0.37, "learning_rate": 0.0024452679446272893, "loss": 0.1397, "step": 14720 }, { "epoch": 0.37, "learning_rate": 0.002444891088611411, "loss": 0.1376, "step": 14730 }, { "epoch": 0.37, "learning_rate": 0.002444514232595533, "loss": 0.1356, "step": 14740 }, { "epoch": 0.37, "learning_rate": 0.002444137376579655, "loss": 0.1392, "step": 14750 }, { "epoch": 0.37, "learning_rate": 0.0024437605205637767, "loss": 0.1397, "step": 14760 }, { "epoch": 0.37, "learning_rate": 0.0024433836645478984, "loss": 0.1373, "step": 14770 }, { "epoch": 0.37, "learning_rate": 0.00244300680853202, "loss": 0.1353, "step": 14780 }, { "epoch": 0.37, "learning_rate": 0.0024426299525161423, "loss": 0.1384, "step": 14790 }, { "epoch": 0.37, "learning_rate": 0.0024422530965002636, "loss": 0.1426, "step": 14800 }, { "epoch": 0.37, "learning_rate": 0.002441876240484386, "loss": 0.1405, "step": 14810 }, { "epoch": 0.37, "learning_rate": 0.0024414993844685076, "loss": 0.1379, "step": 14820 }, { "epoch": 0.37, "learning_rate": 0.0024411225284526293, "loss": 0.1372, "step": 14830 }, { "epoch": 0.37, "learning_rate": 0.002440745672436751, "loss": 0.1399, "step": 14840 }, { "epoch": 0.37, "learning_rate": 0.002440368816420873, "loss": 0.1396, "step": 14850 }, { "epoch": 0.37, "learning_rate": 0.0024399919604049945, "loss": 0.1362, "step": 14860 }, { "epoch": 0.37, "learning_rate": 0.0024396151043891167, "loss": 0.1322, "step": 14870 }, { "epoch": 0.37, "learning_rate": 0.002439238248373238, "loss": 0.1324, "step": 14880 }, { "epoch": 0.37, "learning_rate": 0.00243886139235736, "loss": 0.1387, "step": 14890 }, { "epoch": 0.37, "learning_rate": 0.002438484536341482, "loss": 0.1387, "step": 14900 }, { "epoch": 0.37, "learning_rate": 0.0024381076803256037, "loss": 0.1393, "step": 14910 }, { "epoch": 0.37, "learning_rate": 0.0024377308243097254, "loss": 0.1387, "step": 14920 }, { "epoch": 0.38, "learning_rate": 0.002437353968293847, "loss": 0.1368, "step": 14930 }, { "epoch": 0.38, "learning_rate": 0.002436977112277969, "loss": 0.135, "step": 14940 }, { "epoch": 0.38, "learning_rate": 0.0024366002562620907, "loss": 0.1357, "step": 14950 }, { "epoch": 0.38, "learning_rate": 0.0024362234002462124, "loss": 0.1374, "step": 14960 }, { "epoch": 0.38, "learning_rate": 0.0024358465442303346, "loss": 0.1352, "step": 14970 }, { "epoch": 0.38, "learning_rate": 0.0024354696882144563, "loss": 0.1323, "step": 14980 }, { "epoch": 0.38, "learning_rate": 0.002435092832198578, "loss": 0.135, "step": 14990 }, { "epoch": 0.38, "learning_rate": 0.0024347159761827, "loss": 0.1366, "step": 15000 }, { "epoch": 0.38, "eval_cer": 0.666434232415964, "eval_loss": 0.10666073858737946, "eval_runtime": 90.0505, "eval_samples_per_second": 111.038, "eval_steps_per_second": 6.941, "step": 15000 }, { "epoch": 0.38, "learning_rate": 0.0024343391201668216, "loss": 0.1368, "step": 15010 }, { "epoch": 0.38, "learning_rate": 0.0024339622641509438, "loss": 0.1402, "step": 15020 }, { "epoch": 0.38, "learning_rate": 0.002433585408135065, "loss": 0.1406, "step": 15030 }, { "epoch": 0.38, "learning_rate": 0.002433208552119187, "loss": 0.1365, "step": 15040 }, { "epoch": 0.38, "learning_rate": 0.002432831696103309, "loss": 0.1391, "step": 15050 }, { "epoch": 0.38, "learning_rate": 0.0024324548400874307, "loss": 0.1397, "step": 15060 }, { "epoch": 0.38, "learning_rate": 0.0024320779840715525, "loss": 0.1336, "step": 15070 }, { "epoch": 0.38, "learning_rate": 0.0024317011280556742, "loss": 0.1392, "step": 15080 }, { "epoch": 0.38, "learning_rate": 0.002431324272039796, "loss": 0.1363, "step": 15090 }, { "epoch": 0.38, "learning_rate": 0.002430947416023918, "loss": 0.1367, "step": 15100 }, { "epoch": 0.38, "learning_rate": 0.0024305705600080395, "loss": 0.1324, "step": 15110 }, { "epoch": 0.38, "learning_rate": 0.0024301937039921616, "loss": 0.1361, "step": 15120 }, { "epoch": 0.38, "learning_rate": 0.0024298168479762834, "loss": 0.1381, "step": 15130 }, { "epoch": 0.38, "learning_rate": 0.0024294399919604047, "loss": 0.1354, "step": 15140 }, { "epoch": 0.38, "learning_rate": 0.002429063135944527, "loss": 0.1386, "step": 15150 }, { "epoch": 0.38, "learning_rate": 0.0024286862799286486, "loss": 0.132, "step": 15160 }, { "epoch": 0.38, "learning_rate": 0.0024283094239127704, "loss": 0.136, "step": 15170 }, { "epoch": 0.38, "learning_rate": 0.002427932567896892, "loss": 0.1359, "step": 15180 }, { "epoch": 0.38, "learning_rate": 0.002427555711881014, "loss": 0.1348, "step": 15190 }, { "epoch": 0.38, "learning_rate": 0.002427178855865136, "loss": 0.1383, "step": 15200 }, { "epoch": 0.38, "learning_rate": 0.0024268019998492578, "loss": 0.1339, "step": 15210 }, { "epoch": 0.38, "learning_rate": 0.0024264251438333795, "loss": 0.1309, "step": 15220 }, { "epoch": 0.38, "learning_rate": 0.0024260482878175013, "loss": 0.1417, "step": 15230 }, { "epoch": 0.38, "learning_rate": 0.002425671431801623, "loss": 0.138, "step": 15240 }, { "epoch": 0.38, "learning_rate": 0.002425294575785745, "loss": 0.1366, "step": 15250 }, { "epoch": 0.38, "learning_rate": 0.0024249177197698665, "loss": 0.1383, "step": 15260 }, { "epoch": 0.38, "learning_rate": 0.0024245408637539882, "loss": 0.1379, "step": 15270 }, { "epoch": 0.38, "learning_rate": 0.0024241640077381104, "loss": 0.1375, "step": 15280 }, { "epoch": 0.38, "learning_rate": 0.002423787151722232, "loss": 0.1372, "step": 15290 }, { "epoch": 0.38, "learning_rate": 0.002423410295706354, "loss": 0.1375, "step": 15300 }, { "epoch": 0.38, "learning_rate": 0.0024230334396904757, "loss": 0.1364, "step": 15310 }, { "epoch": 0.38, "learning_rate": 0.0024226565836745974, "loss": 0.1394, "step": 15320 }, { "epoch": 0.39, "learning_rate": 0.0024222797276587196, "loss": 0.137, "step": 15330 }, { "epoch": 0.39, "learning_rate": 0.002421902871642841, "loss": 0.1363, "step": 15340 }, { "epoch": 0.39, "learning_rate": 0.0024215260156269626, "loss": 0.1372, "step": 15350 }, { "epoch": 0.39, "learning_rate": 0.002421149159611085, "loss": 0.138, "step": 15360 }, { "epoch": 0.39, "learning_rate": 0.002420772303595206, "loss": 0.1351, "step": 15370 }, { "epoch": 0.39, "learning_rate": 0.0024203954475793283, "loss": 0.1379, "step": 15380 }, { "epoch": 0.39, "learning_rate": 0.00242001859156345, "loss": 0.1336, "step": 15390 }, { "epoch": 0.39, "learning_rate": 0.002419641735547572, "loss": 0.1313, "step": 15400 }, { "epoch": 0.39, "learning_rate": 0.0024192648795316935, "loss": 0.1377, "step": 15410 }, { "epoch": 0.39, "learning_rate": 0.0024188880235158153, "loss": 0.1355, "step": 15420 }, { "epoch": 0.39, "learning_rate": 0.0024185111674999375, "loss": 0.1379, "step": 15430 }, { "epoch": 0.39, "learning_rate": 0.002418134311484059, "loss": 0.1331, "step": 15440 }, { "epoch": 0.39, "learning_rate": 0.0024177574554681805, "loss": 0.1373, "step": 15450 }, { "epoch": 0.39, "learning_rate": 0.0024173805994523027, "loss": 0.1377, "step": 15460 }, { "epoch": 0.39, "learning_rate": 0.0024170037434364244, "loss": 0.1359, "step": 15470 }, { "epoch": 0.39, "learning_rate": 0.002416626887420546, "loss": 0.1315, "step": 15480 }, { "epoch": 0.39, "learning_rate": 0.002416250031404668, "loss": 0.1301, "step": 15490 }, { "epoch": 0.39, "learning_rate": 0.0024158731753887897, "loss": 0.1362, "step": 15500 }, { "epoch": 0.39, "eval_cer": 0.6669188313610108, "eval_loss": 0.10428140312433243, "eval_runtime": 90.5923, "eval_samples_per_second": 110.374, "eval_steps_per_second": 6.899, "step": 15500 }, { "epoch": 0.39, "learning_rate": 0.002415496319372912, "loss": 0.1352, "step": 15510 }, { "epoch": 0.39, "learning_rate": 0.0024151194633570336, "loss": 0.1348, "step": 15520 }, { "epoch": 0.39, "learning_rate": 0.0024147426073411553, "loss": 0.1319, "step": 15530 }, { "epoch": 0.39, "learning_rate": 0.002414365751325277, "loss": 0.1349, "step": 15540 }, { "epoch": 0.39, "learning_rate": 0.002413988895309399, "loss": 0.1315, "step": 15550 }, { "epoch": 0.39, "learning_rate": 0.002413612039293521, "loss": 0.1331, "step": 15560 }, { "epoch": 0.39, "learning_rate": 0.0024132351832776423, "loss": 0.1334, "step": 15570 }, { "epoch": 0.39, "learning_rate": 0.002412858327261764, "loss": 0.1362, "step": 15580 }, { "epoch": 0.39, "learning_rate": 0.0024124814712458862, "loss": 0.1359, "step": 15590 }, { "epoch": 0.39, "learning_rate": 0.0024121046152300075, "loss": 0.1322, "step": 15600 }, { "epoch": 0.39, "learning_rate": 0.0024117277592141297, "loss": 0.1318, "step": 15610 }, { "epoch": 0.39, "learning_rate": 0.0024113509031982515, "loss": 0.1382, "step": 15620 }, { "epoch": 0.39, "learning_rate": 0.002410974047182373, "loss": 0.1368, "step": 15630 }, { "epoch": 0.39, "learning_rate": 0.002410597191166495, "loss": 0.1303, "step": 15640 }, { "epoch": 0.39, "learning_rate": 0.0024102203351506167, "loss": 0.1356, "step": 15650 }, { "epoch": 0.39, "learning_rate": 0.002409843479134739, "loss": 0.1349, "step": 15660 }, { "epoch": 0.39, "learning_rate": 0.0024094666231188606, "loss": 0.1313, "step": 15670 }, { "epoch": 0.39, "learning_rate": 0.002409089767102982, "loss": 0.13, "step": 15680 }, { "epoch": 0.39, "learning_rate": 0.002408712911087104, "loss": 0.1347, "step": 15690 }, { "epoch": 0.39, "learning_rate": 0.002408336055071226, "loss": 0.1337, "step": 15700 }, { "epoch": 0.39, "learning_rate": 0.0024079591990553476, "loss": 0.1349, "step": 15710 }, { "epoch": 0.39, "learning_rate": 0.0024075823430394694, "loss": 0.132, "step": 15720 }, { "epoch": 0.4, "learning_rate": 0.002407205487023591, "loss": 0.1344, "step": 15730 }, { "epoch": 0.4, "learning_rate": 0.0024068286310077133, "loss": 0.1321, "step": 15740 }, { "epoch": 0.4, "learning_rate": 0.002406451774991835, "loss": 0.1306, "step": 15750 }, { "epoch": 0.4, "learning_rate": 0.0024060749189759563, "loss": 0.1325, "step": 15760 }, { "epoch": 0.4, "learning_rate": 0.0024056980629600785, "loss": 0.1307, "step": 15770 }, { "epoch": 0.4, "learning_rate": 0.0024053212069442003, "loss": 0.1312, "step": 15780 }, { "epoch": 0.4, "learning_rate": 0.002404944350928322, "loss": 0.133, "step": 15790 }, { "epoch": 0.4, "learning_rate": 0.0024045674949124437, "loss": 0.1328, "step": 15800 }, { "epoch": 0.4, "learning_rate": 0.0024041906388965655, "loss": 0.1337, "step": 15810 }, { "epoch": 0.4, "learning_rate": 0.0024038137828806877, "loss": 0.1288, "step": 15820 }, { "epoch": 0.4, "learning_rate": 0.002403436926864809, "loss": 0.1336, "step": 15830 }, { "epoch": 0.4, "learning_rate": 0.002403060070848931, "loss": 0.1361, "step": 15840 }, { "epoch": 0.4, "learning_rate": 0.002402683214833053, "loss": 0.1311, "step": 15850 }, { "epoch": 0.4, "learning_rate": 0.0024023063588171746, "loss": 0.1308, "step": 15860 }, { "epoch": 0.4, "learning_rate": 0.0024019295028012964, "loss": 0.1331, "step": 15870 }, { "epoch": 0.4, "learning_rate": 0.002401552646785418, "loss": 0.1337, "step": 15880 }, { "epoch": 0.4, "learning_rate": 0.00240117579076954, "loss": 0.1339, "step": 15890 }, { "epoch": 0.4, "learning_rate": 0.002400798934753662, "loss": 0.1303, "step": 15900 }, { "epoch": 0.4, "learning_rate": 0.0024004220787377834, "loss": 0.1286, "step": 15910 }, { "epoch": 0.4, "learning_rate": 0.0024000452227219055, "loss": 0.1352, "step": 15920 }, { "epoch": 0.4, "learning_rate": 0.0023996683667060273, "loss": 0.1322, "step": 15930 }, { "epoch": 0.4, "learning_rate": 0.002399291510690149, "loss": 0.1314, "step": 15940 }, { "epoch": 0.4, "learning_rate": 0.0023989146546742708, "loss": 0.1326, "step": 15950 }, { "epoch": 0.4, "learning_rate": 0.0023985377986583925, "loss": 0.1248, "step": 15960 }, { "epoch": 0.4, "learning_rate": 0.0023981609426425147, "loss": 0.1372, "step": 15970 }, { "epoch": 0.4, "learning_rate": 0.0023977840866266364, "loss": 0.1297, "step": 15980 }, { "epoch": 0.4, "learning_rate": 0.0023974072306107578, "loss": 0.1284, "step": 15990 }, { "epoch": 0.4, "learning_rate": 0.00239703037459488, "loss": 0.1375, "step": 16000 }, { "epoch": 0.4, "eval_cer": 0.6667884179408443, "eval_loss": 0.10115189850330353, "eval_runtime": 90.5383, "eval_samples_per_second": 110.439, "eval_steps_per_second": 6.903, "step": 16000 }, { "epoch": 0.4, "learning_rate": 0.0023966535185790017, "loss": 0.1304, "step": 16010 }, { "epoch": 0.4, "learning_rate": 0.0023962766625631234, "loss": 0.1332, "step": 16020 }, { "epoch": 0.4, "learning_rate": 0.002395899806547245, "loss": 0.1248, "step": 16030 }, { "epoch": 0.4, "learning_rate": 0.002395522950531367, "loss": 0.1352, "step": 16040 }, { "epoch": 0.4, "learning_rate": 0.002395146094515489, "loss": 0.1351, "step": 16050 }, { "epoch": 0.4, "learning_rate": 0.0023947692384996104, "loss": 0.1287, "step": 16060 }, { "epoch": 0.4, "learning_rate": 0.0023943923824837326, "loss": 0.1347, "step": 16070 }, { "epoch": 0.4, "learning_rate": 0.0023940155264678543, "loss": 0.129, "step": 16080 }, { "epoch": 0.4, "learning_rate": 0.002393638670451976, "loss": 0.1308, "step": 16090 }, { "epoch": 0.4, "learning_rate": 0.002393261814436098, "loss": 0.1314, "step": 16100 }, { "epoch": 0.4, "learning_rate": 0.0023928849584202196, "loss": 0.1307, "step": 16110 }, { "epoch": 0.4, "learning_rate": 0.0023925081024043413, "loss": 0.1281, "step": 16120 }, { "epoch": 0.41, "learning_rate": 0.0023921312463884635, "loss": 0.1255, "step": 16130 }, { "epoch": 0.41, "learning_rate": 0.002391754390372585, "loss": 0.1315, "step": 16140 }, { "epoch": 0.41, "learning_rate": 0.002391377534356707, "loss": 0.1308, "step": 16150 }, { "epoch": 0.41, "learning_rate": 0.0023910006783408287, "loss": 0.1296, "step": 16160 }, { "epoch": 0.41, "learning_rate": 0.0023906238223249505, "loss": 0.1326, "step": 16170 }, { "epoch": 0.41, "learning_rate": 0.002390246966309072, "loss": 0.1309, "step": 16180 }, { "epoch": 0.41, "learning_rate": 0.002389870110293194, "loss": 0.1344, "step": 16190 }, { "epoch": 0.41, "learning_rate": 0.0023894932542773157, "loss": 0.131, "step": 16200 }, { "epoch": 0.41, "learning_rate": 0.002389116398261438, "loss": 0.1335, "step": 16210 }, { "epoch": 0.41, "learning_rate": 0.002388739542245559, "loss": 0.1325, "step": 16220 }, { "epoch": 0.41, "learning_rate": 0.0023883626862296814, "loss": 0.131, "step": 16230 }, { "epoch": 0.41, "learning_rate": 0.002387985830213803, "loss": 0.132, "step": 16240 }, { "epoch": 0.41, "learning_rate": 0.002387608974197925, "loss": 0.1291, "step": 16250 }, { "epoch": 0.41, "learning_rate": 0.0023872321181820466, "loss": 0.1333, "step": 16260 }, { "epoch": 0.41, "learning_rate": 0.0023868552621661683, "loss": 0.1288, "step": 16270 }, { "epoch": 0.41, "learning_rate": 0.0023864784061502905, "loss": 0.135, "step": 16280 }, { "epoch": 0.41, "learning_rate": 0.002386101550134412, "loss": 0.1296, "step": 16290 }, { "epoch": 0.41, "learning_rate": 0.0023857246941185336, "loss": 0.1361, "step": 16300 }, { "epoch": 0.41, "learning_rate": 0.0023853478381026558, "loss": 0.1353, "step": 16310 }, { "epoch": 0.41, "learning_rate": 0.0023849709820867775, "loss": 0.1296, "step": 16320 }, { "epoch": 0.41, "learning_rate": 0.0023845941260708992, "loss": 0.131, "step": 16330 }, { "epoch": 0.41, "learning_rate": 0.002384217270055021, "loss": 0.126, "step": 16340 }, { "epoch": 0.41, "learning_rate": 0.0023838404140391427, "loss": 0.1299, "step": 16350 }, { "epoch": 0.41, "learning_rate": 0.002383463558023265, "loss": 0.1355, "step": 16360 }, { "epoch": 0.41, "learning_rate": 0.0023830867020073862, "loss": 0.1266, "step": 16370 }, { "epoch": 0.41, "learning_rate": 0.0023827098459915084, "loss": 0.129, "step": 16380 }, { "epoch": 0.41, "learning_rate": 0.00238233298997563, "loss": 0.1271, "step": 16390 }, { "epoch": 0.41, "learning_rate": 0.002381956133959752, "loss": 0.1268, "step": 16400 }, { "epoch": 0.41, "learning_rate": 0.0023815792779438736, "loss": 0.1308, "step": 16410 }, { "epoch": 0.41, "learning_rate": 0.0023812024219279954, "loss": 0.1335, "step": 16420 }, { "epoch": 0.41, "learning_rate": 0.002380825565912117, "loss": 0.13, "step": 16430 }, { "epoch": 0.41, "learning_rate": 0.0023804487098962393, "loss": 0.1295, "step": 16440 }, { "epoch": 0.41, "learning_rate": 0.0023800718538803606, "loss": 0.1331, "step": 16450 }, { "epoch": 0.41, "learning_rate": 0.002379694997864483, "loss": 0.1305, "step": 16460 }, { "epoch": 0.41, "learning_rate": 0.0023793181418486045, "loss": 0.127, "step": 16470 }, { "epoch": 0.41, "learning_rate": 0.0023789412858327263, "loss": 0.1286, "step": 16480 }, { "epoch": 0.41, "learning_rate": 0.002378564429816848, "loss": 0.1325, "step": 16490 }, { "epoch": 0.41, "learning_rate": 0.0023781875738009698, "loss": 0.1325, "step": 16500 }, { "epoch": 0.41, "eval_cer": 0.6672475116782571, "eval_loss": 0.09959594905376434, "eval_runtime": 90.384, "eval_samples_per_second": 110.628, "eval_steps_per_second": 6.915, "step": 16500 }, { "epoch": 0.41, "learning_rate": 0.0023778107177850915, "loss": 0.1236, "step": 16510 }, { "epoch": 0.42, "learning_rate": 0.0023774338617692133, "loss": 0.1281, "step": 16520 }, { "epoch": 0.42, "learning_rate": 0.002377057005753335, "loss": 0.1294, "step": 16530 }, { "epoch": 0.42, "learning_rate": 0.002376680149737457, "loss": 0.129, "step": 16540 }, { "epoch": 0.42, "learning_rate": 0.002376303293721579, "loss": 0.1296, "step": 16550 }, { "epoch": 0.42, "learning_rate": 0.0023759264377057007, "loss": 0.1235, "step": 16560 }, { "epoch": 0.42, "learning_rate": 0.0023755495816898224, "loss": 0.132, "step": 16570 }, { "epoch": 0.42, "learning_rate": 0.002375172725673944, "loss": 0.1317, "step": 16580 }, { "epoch": 0.42, "learning_rate": 0.0023747958696580663, "loss": 0.1299, "step": 16590 }, { "epoch": 0.42, "learning_rate": 0.0023744190136421876, "loss": 0.1312, "step": 16600 }, { "epoch": 0.42, "learning_rate": 0.0023740421576263094, "loss": 0.1296, "step": 16610 }, { "epoch": 0.42, "learning_rate": 0.0023736653016104316, "loss": 0.1294, "step": 16620 }, { "epoch": 0.42, "learning_rate": 0.0023732884455945533, "loss": 0.1285, "step": 16630 }, { "epoch": 0.42, "learning_rate": 0.002372911589578675, "loss": 0.1263, "step": 16640 }, { "epoch": 0.42, "learning_rate": 0.002372534733562797, "loss": 0.126, "step": 16650 }, { "epoch": 0.42, "learning_rate": 0.0023721578775469186, "loss": 0.132, "step": 16660 }, { "epoch": 0.42, "learning_rate": 0.0023717810215310407, "loss": 0.1263, "step": 16670 }, { "epoch": 0.42, "learning_rate": 0.002371404165515162, "loss": 0.1259, "step": 16680 }, { "epoch": 0.42, "learning_rate": 0.0023710273094992842, "loss": 0.1279, "step": 16690 }, { "epoch": 0.42, "learning_rate": 0.002370650453483406, "loss": 0.1294, "step": 16700 }, { "epoch": 0.42, "learning_rate": 0.0023702735974675273, "loss": 0.1265, "step": 16710 }, { "epoch": 0.42, "learning_rate": 0.0023698967414516495, "loss": 0.1238, "step": 16720 }, { "epoch": 0.42, "learning_rate": 0.002369519885435771, "loss": 0.1275, "step": 16730 }, { "epoch": 0.42, "learning_rate": 0.002369143029419893, "loss": 0.1314, "step": 16740 }, { "epoch": 0.42, "learning_rate": 0.0023687661734040147, "loss": 0.1291, "step": 16750 }, { "epoch": 0.42, "learning_rate": 0.0023683893173881364, "loss": 0.1285, "step": 16760 }, { "epoch": 0.42, "learning_rate": 0.0023680124613722586, "loss": 0.1266, "step": 16770 }, { "epoch": 0.42, "learning_rate": 0.0023676356053563804, "loss": 0.1264, "step": 16780 }, { "epoch": 0.42, "learning_rate": 0.002367258749340502, "loss": 0.1287, "step": 16790 }, { "epoch": 0.42, "learning_rate": 0.002366881893324624, "loss": 0.1263, "step": 16800 }, { "epoch": 0.42, "learning_rate": 0.0023665050373087456, "loss": 0.1273, "step": 16810 }, { "epoch": 0.42, "learning_rate": 0.0023661281812928678, "loss": 0.1295, "step": 16820 }, { "epoch": 0.42, "learning_rate": 0.002365751325276989, "loss": 0.1266, "step": 16830 }, { "epoch": 0.42, "learning_rate": 0.002365374469261111, "loss": 0.1238, "step": 16840 }, { "epoch": 0.42, "learning_rate": 0.002364997613245233, "loss": 0.1303, "step": 16850 }, { "epoch": 0.42, "learning_rate": 0.0023646207572293547, "loss": 0.1264, "step": 16860 }, { "epoch": 0.42, "learning_rate": 0.0023642439012134765, "loss": 0.1264, "step": 16870 }, { "epoch": 0.42, "learning_rate": 0.0023638670451975982, "loss": 0.1284, "step": 16880 }, { "epoch": 0.42, "learning_rate": 0.00236349018918172, "loss": 0.1287, "step": 16890 }, { "epoch": 0.42, "learning_rate": 0.002363113333165842, "loss": 0.1283, "step": 16900 }, { "epoch": 0.42, "learning_rate": 0.0023627364771499635, "loss": 0.1314, "step": 16910 }, { "epoch": 0.43, "learning_rate": 0.002362359621134085, "loss": 0.1295, "step": 16920 }, { "epoch": 0.43, "learning_rate": 0.0023619827651182074, "loss": 0.1247, "step": 16930 }, { "epoch": 0.43, "learning_rate": 0.0023616059091023287, "loss": 0.1302, "step": 16940 }, { "epoch": 0.43, "learning_rate": 0.002361229053086451, "loss": 0.1249, "step": 16950 }, { "epoch": 0.43, "learning_rate": 0.0023608521970705726, "loss": 0.1342, "step": 16960 }, { "epoch": 0.43, "learning_rate": 0.0023604753410546944, "loss": 0.1287, "step": 16970 }, { "epoch": 0.43, "learning_rate": 0.002360098485038816, "loss": 0.1265, "step": 16980 }, { "epoch": 0.43, "learning_rate": 0.002359721629022938, "loss": 0.1266, "step": 16990 }, { "epoch": 0.43, "learning_rate": 0.00235934477300706, "loss": 0.1277, "step": 17000 }, { "epoch": 0.43, "eval_cer": 0.6664294201126367, "eval_loss": 0.0992693156003952, "eval_runtime": 89.9278, "eval_samples_per_second": 111.189, "eval_steps_per_second": 6.95, "step": 17000 }, { "epoch": 0.43, "learning_rate": 0.0023589679169911818, "loss": 0.1268, "step": 17010 }, { "epoch": 0.43, "learning_rate": 0.002358591060975303, "loss": 0.1255, "step": 17020 }, { "epoch": 0.43, "learning_rate": 0.0023582142049594253, "loss": 0.1296, "step": 17030 }, { "epoch": 0.43, "learning_rate": 0.002357837348943547, "loss": 0.1273, "step": 17040 }, { "epoch": 0.43, "learning_rate": 0.0023574604929276688, "loss": 0.1304, "step": 17050 }, { "epoch": 0.43, "learning_rate": 0.0023570836369117905, "loss": 0.1262, "step": 17060 }, { "epoch": 0.43, "learning_rate": 0.0023567067808959122, "loss": 0.1257, "step": 17070 }, { "epoch": 0.43, "learning_rate": 0.0023563299248800344, "loss": 0.1275, "step": 17080 }, { "epoch": 0.43, "learning_rate": 0.002355953068864156, "loss": 0.1241, "step": 17090 }, { "epoch": 0.43, "learning_rate": 0.002355576212848278, "loss": 0.126, "step": 17100 }, { "epoch": 0.43, "learning_rate": 0.0023551993568323997, "loss": 0.1239, "step": 17110 }, { "epoch": 0.43, "learning_rate": 0.0023548225008165214, "loss": 0.1276, "step": 17120 }, { "epoch": 0.43, "learning_rate": 0.0023544456448006436, "loss": 0.127, "step": 17130 }, { "epoch": 0.43, "learning_rate": 0.002354068788784765, "loss": 0.1229, "step": 17140 }, { "epoch": 0.43, "learning_rate": 0.0023536919327688866, "loss": 0.1245, "step": 17150 }, { "epoch": 0.43, "learning_rate": 0.002353315076753009, "loss": 0.1276, "step": 17160 }, { "epoch": 0.43, "learning_rate": 0.00235293822073713, "loss": 0.1289, "step": 17170 }, { "epoch": 0.43, "learning_rate": 0.0023525613647212523, "loss": 0.1231, "step": 17180 }, { "epoch": 0.43, "learning_rate": 0.002352184508705374, "loss": 0.1289, "step": 17190 }, { "epoch": 0.43, "learning_rate": 0.002351807652689496, "loss": 0.1239, "step": 17200 }, { "epoch": 0.43, "learning_rate": 0.0023514307966736175, "loss": 0.1276, "step": 17210 }, { "epoch": 0.43, "learning_rate": 0.0023510539406577393, "loss": 0.1261, "step": 17220 }, { "epoch": 0.43, "learning_rate": 0.0023506770846418615, "loss": 0.13, "step": 17230 }, { "epoch": 0.43, "learning_rate": 0.002350300228625983, "loss": 0.1246, "step": 17240 }, { "epoch": 0.43, "learning_rate": 0.0023499233726101045, "loss": 0.1247, "step": 17250 }, { "epoch": 0.43, "learning_rate": 0.0023495465165942267, "loss": 0.1258, "step": 17260 }, { "epoch": 0.43, "learning_rate": 0.0023491696605783484, "loss": 0.1278, "step": 17270 }, { "epoch": 0.43, "learning_rate": 0.00234879280456247, "loss": 0.1273, "step": 17280 }, { "epoch": 0.43, "learning_rate": 0.002348415948546592, "loss": 0.1286, "step": 17290 }, { "epoch": 0.43, "learning_rate": 0.0023480390925307137, "loss": 0.1257, "step": 17300 }, { "epoch": 0.43, "learning_rate": 0.002347662236514836, "loss": 0.1244, "step": 17310 }, { "epoch": 0.44, "learning_rate": 0.0023472853804989576, "loss": 0.1232, "step": 17320 }, { "epoch": 0.44, "learning_rate": 0.002346908524483079, "loss": 0.1284, "step": 17330 }, { "epoch": 0.44, "learning_rate": 0.002346531668467201, "loss": 0.1194, "step": 17340 }, { "epoch": 0.44, "learning_rate": 0.002346154812451323, "loss": 0.13, "step": 17350 }, { "epoch": 0.44, "learning_rate": 0.0023457779564354446, "loss": 0.1288, "step": 17360 }, { "epoch": 0.44, "learning_rate": 0.0023454011004195663, "loss": 0.1264, "step": 17370 }, { "epoch": 0.44, "learning_rate": 0.002345024244403688, "loss": 0.1265, "step": 17380 }, { "epoch": 0.44, "learning_rate": 0.0023446473883878102, "loss": 0.1252, "step": 17390 }, { "epoch": 0.44, "learning_rate": 0.0023442705323719316, "loss": 0.1218, "step": 17400 }, { "epoch": 0.44, "learning_rate": 0.0023438936763560537, "loss": 0.1263, "step": 17410 }, { "epoch": 0.44, "learning_rate": 0.0023435168203401755, "loss": 0.1277, "step": 17420 }, { "epoch": 0.44, "learning_rate": 0.0023431399643242972, "loss": 0.1216, "step": 17430 }, { "epoch": 0.44, "learning_rate": 0.002342763108308419, "loss": 0.1234, "step": 17440 }, { "epoch": 0.44, "learning_rate": 0.0023423862522925407, "loss": 0.1257, "step": 17450 }, { "epoch": 0.44, "learning_rate": 0.0023420093962766625, "loss": 0.128, "step": 17460 }, { "epoch": 0.44, "learning_rate": 0.0023416325402607846, "loss": 0.123, "step": 17470 }, { "epoch": 0.44, "learning_rate": 0.002341255684244906, "loss": 0.1204, "step": 17480 }, { "epoch": 0.44, "learning_rate": 0.002340878828229028, "loss": 0.1233, "step": 17490 }, { "epoch": 0.44, "learning_rate": 0.00234050197221315, "loss": 0.1261, "step": 17500 }, { "epoch": 0.44, "eval_cer": 0.6667470321322305, "eval_loss": 0.09771975874900818, "eval_runtime": 90.5027, "eval_samples_per_second": 110.483, "eval_steps_per_second": 6.906, "step": 17500 }, { "epoch": 0.44, "learning_rate": 0.0023401251161972716, "loss": 0.1238, "step": 17510 }, { "epoch": 0.44, "learning_rate": 0.0023397482601813934, "loss": 0.1288, "step": 17520 }, { "epoch": 0.44, "learning_rate": 0.002339371404165515, "loss": 0.1262, "step": 17530 }, { "epoch": 0.44, "learning_rate": 0.0023389945481496373, "loss": 0.1228, "step": 17540 }, { "epoch": 0.44, "learning_rate": 0.002338617692133759, "loss": 0.1256, "step": 17550 }, { "epoch": 0.44, "learning_rate": 0.0023382408361178803, "loss": 0.1243, "step": 17560 }, { "epoch": 0.44, "learning_rate": 0.0023378639801020025, "loss": 0.1237, "step": 17570 }, { "epoch": 0.44, "learning_rate": 0.0023374871240861243, "loss": 0.1283, "step": 17580 }, { "epoch": 0.44, "learning_rate": 0.002337110268070246, "loss": 0.1226, "step": 17590 }, { "epoch": 0.44, "learning_rate": 0.0023367334120543677, "loss": 0.1264, "step": 17600 }, { "epoch": 0.44, "learning_rate": 0.0023363565560384895, "loss": 0.1233, "step": 17610 }, { "epoch": 0.44, "learning_rate": 0.0023359797000226117, "loss": 0.128, "step": 17620 }, { "epoch": 0.44, "learning_rate": 0.002335602844006733, "loss": 0.1229, "step": 17630 }, { "epoch": 0.44, "learning_rate": 0.002335225987990855, "loss": 0.122, "step": 17640 }, { "epoch": 0.44, "learning_rate": 0.002334849131974977, "loss": 0.1308, "step": 17650 }, { "epoch": 0.44, "learning_rate": 0.0023344722759590987, "loss": 0.1234, "step": 17660 }, { "epoch": 0.44, "learning_rate": 0.0023340954199432204, "loss": 0.1256, "step": 17670 }, { "epoch": 0.44, "learning_rate": 0.002333718563927342, "loss": 0.1232, "step": 17680 }, { "epoch": 0.44, "learning_rate": 0.002333341707911464, "loss": 0.1286, "step": 17690 }, { "epoch": 0.44, "learning_rate": 0.002332964851895586, "loss": 0.1266, "step": 17700 }, { "epoch": 0.44, "learning_rate": 0.0023325879958797074, "loss": 0.1291, "step": 17710 }, { "epoch": 0.45, "learning_rate": 0.0023322111398638296, "loss": 0.1222, "step": 17720 }, { "epoch": 0.45, "learning_rate": 0.0023318342838479513, "loss": 0.1305, "step": 17730 }, { "epoch": 0.45, "learning_rate": 0.002331457427832073, "loss": 0.1229, "step": 17740 }, { "epoch": 0.45, "learning_rate": 0.002331080571816195, "loss": 0.1247, "step": 17750 }, { "epoch": 0.45, "learning_rate": 0.0023307037158003165, "loss": 0.1236, "step": 17760 }, { "epoch": 0.45, "learning_rate": 0.0023303268597844383, "loss": 0.1223, "step": 17770 }, { "epoch": 0.45, "learning_rate": 0.0023299500037685605, "loss": 0.1233, "step": 17780 }, { "epoch": 0.45, "learning_rate": 0.0023295731477526818, "loss": 0.1242, "step": 17790 }, { "epoch": 0.45, "learning_rate": 0.002329196291736804, "loss": 0.1234, "step": 17800 }, { "epoch": 0.45, "learning_rate": 0.0023288194357209257, "loss": 0.125, "step": 17810 }, { "epoch": 0.45, "learning_rate": 0.0023284425797050474, "loss": 0.1259, "step": 17820 }, { "epoch": 0.45, "learning_rate": 0.002328065723689169, "loss": 0.1273, "step": 17830 }, { "epoch": 0.45, "learning_rate": 0.002327688867673291, "loss": 0.1222, "step": 17840 }, { "epoch": 0.45, "learning_rate": 0.002327312011657413, "loss": 0.1231, "step": 17850 }, { "epoch": 0.45, "learning_rate": 0.0023269351556415344, "loss": 0.127, "step": 17860 }, { "epoch": 0.45, "learning_rate": 0.002326558299625656, "loss": 0.1236, "step": 17870 }, { "epoch": 0.45, "learning_rate": 0.0023261814436097783, "loss": 0.121, "step": 17880 }, { "epoch": 0.45, "learning_rate": 0.0023258045875939, "loss": 0.1251, "step": 17890 }, { "epoch": 0.45, "learning_rate": 0.002325427731578022, "loss": 0.1245, "step": 17900 }, { "epoch": 0.45, "learning_rate": 0.0023250508755621436, "loss": 0.123, "step": 17910 }, { "epoch": 0.45, "learning_rate": 0.0023246740195462653, "loss": 0.1223, "step": 17920 }, { "epoch": 0.45, "learning_rate": 0.0023242971635303875, "loss": 0.1253, "step": 17930 }, { "epoch": 0.45, "learning_rate": 0.002323920307514509, "loss": 0.1272, "step": 17940 }, { "epoch": 0.45, "learning_rate": 0.002323543451498631, "loss": 0.1252, "step": 17950 }, { "epoch": 0.45, "learning_rate": 0.0023231665954827527, "loss": 0.1234, "step": 17960 }, { "epoch": 0.45, "learning_rate": 0.0023227897394668745, "loss": 0.1189, "step": 17970 }, { "epoch": 0.45, "learning_rate": 0.002322412883450996, "loss": 0.1245, "step": 17980 }, { "epoch": 0.45, "learning_rate": 0.002322036027435118, "loss": 0.126, "step": 17990 }, { "epoch": 0.45, "learning_rate": 0.0023216591714192397, "loss": 0.1274, "step": 18000 }, { "epoch": 0.45, "eval_cer": 0.6665598335328033, "eval_loss": 0.09775370359420776, "eval_runtime": 90.7418, "eval_samples_per_second": 110.192, "eval_steps_per_second": 6.888, "step": 18000 }, { "epoch": 0.45, "learning_rate": 0.002321282315403362, "loss": 0.1237, "step": 18010 }, { "epoch": 0.45, "learning_rate": 0.002320905459387483, "loss": 0.1249, "step": 18020 }, { "epoch": 0.45, "learning_rate": 0.0023205286033716054, "loss": 0.1234, "step": 18030 }, { "epoch": 0.45, "learning_rate": 0.002320151747355727, "loss": 0.1262, "step": 18040 }, { "epoch": 0.45, "learning_rate": 0.002319774891339849, "loss": 0.1243, "step": 18050 }, { "epoch": 0.45, "learning_rate": 0.0023193980353239706, "loss": 0.1269, "step": 18060 }, { "epoch": 0.45, "learning_rate": 0.0023190211793080923, "loss": 0.12, "step": 18070 }, { "epoch": 0.45, "learning_rate": 0.002318644323292214, "loss": 0.123, "step": 18080 }, { "epoch": 0.45, "learning_rate": 0.002318267467276336, "loss": 0.1257, "step": 18090 }, { "epoch": 0.45, "learning_rate": 0.0023178906112604576, "loss": 0.1206, "step": 18100 }, { "epoch": 0.45, "learning_rate": 0.0023175137552445798, "loss": 0.1256, "step": 18110 }, { "epoch": 0.46, "learning_rate": 0.0023171368992287015, "loss": 0.1233, "step": 18120 }, { "epoch": 0.46, "learning_rate": 0.0023167600432128233, "loss": 0.1218, "step": 18130 }, { "epoch": 0.46, "learning_rate": 0.002316383187196945, "loss": 0.1226, "step": 18140 }, { "epoch": 0.46, "learning_rate": 0.0023160063311810667, "loss": 0.1261, "step": 18150 }, { "epoch": 0.46, "learning_rate": 0.002315629475165189, "loss": 0.1266, "step": 18160 }, { "epoch": 0.46, "learning_rate": 0.0023152526191493102, "loss": 0.1251, "step": 18170 }, { "epoch": 0.46, "learning_rate": 0.002314875763133432, "loss": 0.1207, "step": 18180 }, { "epoch": 0.46, "learning_rate": 0.002314498907117554, "loss": 0.1216, "step": 18190 }, { "epoch": 0.46, "learning_rate": 0.002314122051101676, "loss": 0.1245, "step": 18200 }, { "epoch": 0.46, "learning_rate": 0.0023137451950857976, "loss": 0.1237, "step": 18210 }, { "epoch": 0.46, "learning_rate": 0.0023133683390699194, "loss": 0.1242, "step": 18220 }, { "epoch": 0.46, "learning_rate": 0.002312991483054041, "loss": 0.1258, "step": 18230 }, { "epoch": 0.46, "learning_rate": 0.0023126146270381633, "loss": 0.1235, "step": 18240 }, { "epoch": 0.46, "learning_rate": 0.0023122377710222846, "loss": 0.1249, "step": 18250 }, { "epoch": 0.46, "learning_rate": 0.002311860915006407, "loss": 0.1215, "step": 18260 }, { "epoch": 0.46, "learning_rate": 0.0023114840589905285, "loss": 0.1191, "step": 18270 }, { "epoch": 0.46, "learning_rate": 0.00231110720297465, "loss": 0.124, "step": 18280 }, { "epoch": 0.46, "learning_rate": 0.002310730346958772, "loss": 0.118, "step": 18290 }, { "epoch": 0.46, "learning_rate": 0.0023103534909428938, "loss": 0.1242, "step": 18300 }, { "epoch": 0.46, "learning_rate": 0.0023099766349270155, "loss": 0.1194, "step": 18310 }, { "epoch": 0.46, "learning_rate": 0.0023095997789111373, "loss": 0.1201, "step": 18320 }, { "epoch": 0.46, "learning_rate": 0.002309222922895259, "loss": 0.124, "step": 18330 }, { "epoch": 0.46, "learning_rate": 0.002308846066879381, "loss": 0.1186, "step": 18340 }, { "epoch": 0.46, "learning_rate": 0.002308469210863503, "loss": 0.1269, "step": 18350 }, { "epoch": 0.46, "learning_rate": 0.0023080923548476247, "loss": 0.1216, "step": 18360 }, { "epoch": 0.46, "learning_rate": 0.0023077154988317464, "loss": 0.1281, "step": 18370 }, { "epoch": 0.46, "learning_rate": 0.002307338642815868, "loss": 0.1173, "step": 18380 }, { "epoch": 0.46, "learning_rate": 0.0023069617867999903, "loss": 0.1263, "step": 18390 }, { "epoch": 0.46, "learning_rate": 0.0023065849307841117, "loss": 0.1241, "step": 18400 }, { "epoch": 0.46, "learning_rate": 0.0023062080747682334, "loss": 0.1192, "step": 18410 }, { "epoch": 0.46, "learning_rate": 0.0023058312187523556, "loss": 0.1211, "step": 18420 }, { "epoch": 0.46, "learning_rate": 0.0023054543627364773, "loss": 0.1245, "step": 18430 }, { "epoch": 0.46, "learning_rate": 0.002305077506720599, "loss": 0.1278, "step": 18440 }, { "epoch": 0.46, "learning_rate": 0.002304700650704721, "loss": 0.1201, "step": 18450 }, { "epoch": 0.46, "learning_rate": 0.0023043237946888426, "loss": 0.1232, "step": 18460 }, { "epoch": 0.46, "learning_rate": 0.0023039469386729643, "loss": 0.1217, "step": 18470 }, { "epoch": 0.46, "learning_rate": 0.002303570082657086, "loss": 0.1234, "step": 18480 }, { "epoch": 0.46, "learning_rate": 0.002303193226641208, "loss": 0.1227, "step": 18490 }, { "epoch": 0.46, "learning_rate": 0.00230281637062533, "loss": 0.127, "step": 18500 }, { "epoch": 0.46, "eval_cer": 0.666954442405632, "eval_loss": 0.09521838277578354, "eval_runtime": 90.8104, "eval_samples_per_second": 110.108, "eval_steps_per_second": 6.882, "step": 18500 }, { "epoch": 0.47, "learning_rate": 0.0023024395146094513, "loss": 0.1223, "step": 18510 }, { "epoch": 0.47, "learning_rate": 0.0023020626585935735, "loss": 0.1227, "step": 18520 }, { "epoch": 0.47, "learning_rate": 0.002301685802577695, "loss": 0.125, "step": 18530 }, { "epoch": 0.47, "learning_rate": 0.002301308946561817, "loss": 0.1247, "step": 18540 }, { "epoch": 0.47, "learning_rate": 0.0023009320905459387, "loss": 0.123, "step": 18550 }, { "epoch": 0.47, "learning_rate": 0.0023005552345300604, "loss": 0.1183, "step": 18560 }, { "epoch": 0.47, "learning_rate": 0.0023001783785141826, "loss": 0.1241, "step": 18570 }, { "epoch": 0.47, "learning_rate": 0.0022998015224983044, "loss": 0.1171, "step": 18580 }, { "epoch": 0.47, "learning_rate": 0.0022994246664824257, "loss": 0.1219, "step": 18590 }, { "epoch": 0.47, "learning_rate": 0.002299047810466548, "loss": 0.1205, "step": 18600 }, { "epoch": 0.47, "learning_rate": 0.0022986709544506696, "loss": 0.1256, "step": 18610 }, { "epoch": 0.47, "learning_rate": 0.0022982940984347913, "loss": 0.1216, "step": 18620 }, { "epoch": 0.47, "learning_rate": 0.002297917242418913, "loss": 0.1178, "step": 18630 }, { "epoch": 0.47, "learning_rate": 0.002297540386403035, "loss": 0.1251, "step": 18640 }, { "epoch": 0.47, "learning_rate": 0.002297163530387157, "loss": 0.1244, "step": 18650 }, { "epoch": 0.47, "learning_rate": 0.0022967866743712788, "loss": 0.1232, "step": 18660 }, { "epoch": 0.47, "learning_rate": 0.0022964098183554005, "loss": 0.122, "step": 18670 }, { "epoch": 0.47, "learning_rate": 0.0022960329623395222, "loss": 0.1202, "step": 18680 }, { "epoch": 0.47, "learning_rate": 0.002295656106323644, "loss": 0.121, "step": 18690 }, { "epoch": 0.47, "learning_rate": 0.0022952792503077657, "loss": 0.1192, "step": 18700 }, { "epoch": 0.47, "learning_rate": 0.0022949023942918875, "loss": 0.1214, "step": 18710 }, { "epoch": 0.47, "learning_rate": 0.0022945255382760092, "loss": 0.1244, "step": 18720 }, { "epoch": 0.47, "learning_rate": 0.0022941486822601314, "loss": 0.1192, "step": 18730 }, { "epoch": 0.47, "learning_rate": 0.0022937718262442527, "loss": 0.1202, "step": 18740 }, { "epoch": 0.47, "learning_rate": 0.002293394970228375, "loss": 0.1208, "step": 18750 }, { "epoch": 0.47, "learning_rate": 0.0022930181142124966, "loss": 0.1224, "step": 18760 }, { "epoch": 0.47, "learning_rate": 0.0022926412581966184, "loss": 0.1217, "step": 18770 }, { "epoch": 0.47, "learning_rate": 0.00229226440218074, "loss": 0.1192, "step": 18780 }, { "epoch": 0.47, "learning_rate": 0.002291887546164862, "loss": 0.1227, "step": 18790 }, { "epoch": 0.47, "learning_rate": 0.002291510690148984, "loss": 0.1202, "step": 18800 }, { "epoch": 0.47, "learning_rate": 0.002291133834133106, "loss": 0.1191, "step": 18810 }, { "epoch": 0.47, "learning_rate": 0.002290756978117227, "loss": 0.1211, "step": 18820 }, { "epoch": 0.47, "learning_rate": 0.0022903801221013493, "loss": 0.1165, "step": 18830 }, { "epoch": 0.47, "learning_rate": 0.002290003266085471, "loss": 0.1223, "step": 18840 }, { "epoch": 0.47, "learning_rate": 0.0022896264100695928, "loss": 0.1191, "step": 18850 }, { "epoch": 0.47, "learning_rate": 0.0022892495540537145, "loss": 0.1233, "step": 18860 }, { "epoch": 0.47, "learning_rate": 0.0022888726980378363, "loss": 0.1229, "step": 18870 }, { "epoch": 0.47, "learning_rate": 0.0022884958420219584, "loss": 0.1229, "step": 18880 }, { "epoch": 0.47, "learning_rate": 0.00228811898600608, "loss": 0.1148, "step": 18890 }, { "epoch": 0.47, "learning_rate": 0.0022877421299902015, "loss": 0.122, "step": 18900 }, { "epoch": 0.48, "learning_rate": 0.0022873652739743237, "loss": 0.1173, "step": 18910 }, { "epoch": 0.48, "learning_rate": 0.0022869884179584454, "loss": 0.1202, "step": 18920 }, { "epoch": 0.48, "learning_rate": 0.002286611561942567, "loss": 0.1187, "step": 18930 }, { "epoch": 0.48, "learning_rate": 0.002286234705926689, "loss": 0.1185, "step": 18940 }, { "epoch": 0.48, "learning_rate": 0.0022858578499108106, "loss": 0.1197, "step": 18950 }, { "epoch": 0.48, "learning_rate": 0.002285480993894933, "loss": 0.1194, "step": 18960 }, { "epoch": 0.48, "learning_rate": 0.002285104137879054, "loss": 0.1173, "step": 18970 }, { "epoch": 0.48, "learning_rate": 0.0022847272818631763, "loss": 0.1204, "step": 18980 }, { "epoch": 0.48, "learning_rate": 0.002284350425847298, "loss": 0.122, "step": 18990 }, { "epoch": 0.48, "learning_rate": 0.00228397356983142, "loss": 0.1218, "step": 19000 }, { "epoch": 0.48, "eval_cer": 0.6666175811727294, "eval_loss": 0.09327735006809235, "eval_runtime": 90.7107, "eval_samples_per_second": 110.23, "eval_steps_per_second": 6.89, "step": 19000 }, { "epoch": 0.48, "learning_rate": 0.0022835967138155415, "loss": 0.1221, "step": 19010 }, { "epoch": 0.48, "learning_rate": 0.0022832198577996633, "loss": 0.116, "step": 19020 }, { "epoch": 0.48, "learning_rate": 0.002282843001783785, "loss": 0.1177, "step": 19030 }, { "epoch": 0.48, "learning_rate": 0.002282466145767907, "loss": 0.1163, "step": 19040 }, { "epoch": 0.48, "learning_rate": 0.0022820892897520285, "loss": 0.1187, "step": 19050 }, { "epoch": 0.48, "learning_rate": 0.0022817124337361507, "loss": 0.1194, "step": 19060 }, { "epoch": 0.48, "learning_rate": 0.0022813355777202724, "loss": 0.1258, "step": 19070 }, { "epoch": 0.48, "learning_rate": 0.002280958721704394, "loss": 0.1166, "step": 19080 }, { "epoch": 0.48, "learning_rate": 0.002280581865688516, "loss": 0.1228, "step": 19090 }, { "epoch": 0.48, "learning_rate": 0.0022802050096726377, "loss": 0.1203, "step": 19100 }, { "epoch": 0.48, "learning_rate": 0.00227982815365676, "loss": 0.1189, "step": 19110 }, { "epoch": 0.48, "learning_rate": 0.0022794512976408816, "loss": 0.122, "step": 19120 }, { "epoch": 0.48, "learning_rate": 0.002279074441625003, "loss": 0.124, "step": 19130 }, { "epoch": 0.48, "learning_rate": 0.002278697585609125, "loss": 0.1167, "step": 19140 }, { "epoch": 0.48, "learning_rate": 0.002278320729593247, "loss": 0.1135, "step": 19150 }, { "epoch": 0.48, "learning_rate": 0.0022779438735773686, "loss": 0.1167, "step": 19160 }, { "epoch": 0.48, "learning_rate": 0.0022775670175614903, "loss": 0.1166, "step": 19170 }, { "epoch": 0.48, "learning_rate": 0.002277190161545612, "loss": 0.121, "step": 19180 }, { "epoch": 0.48, "learning_rate": 0.0022768133055297343, "loss": 0.1165, "step": 19190 }, { "epoch": 0.48, "learning_rate": 0.0022764364495138556, "loss": 0.1173, "step": 19200 }, { "epoch": 0.48, "learning_rate": 0.0022760595934979777, "loss": 0.1213, "step": 19210 }, { "epoch": 0.48, "learning_rate": 0.0022756827374820995, "loss": 0.1188, "step": 19220 }, { "epoch": 0.48, "learning_rate": 0.0022753058814662212, "loss": 0.1217, "step": 19230 }, { "epoch": 0.48, "learning_rate": 0.002274929025450343, "loss": 0.1161, "step": 19240 }, { "epoch": 0.48, "learning_rate": 0.0022745521694344647, "loss": 0.1178, "step": 19250 }, { "epoch": 0.48, "learning_rate": 0.0022741753134185865, "loss": 0.1174, "step": 19260 }, { "epoch": 0.48, "learning_rate": 0.0022737984574027086, "loss": 0.1216, "step": 19270 }, { "epoch": 0.48, "learning_rate": 0.00227342160138683, "loss": 0.1221, "step": 19280 }, { "epoch": 0.48, "learning_rate": 0.002273044745370952, "loss": 0.1164, "step": 19290 }, { "epoch": 0.48, "learning_rate": 0.002272667889355074, "loss": 0.1192, "step": 19300 }, { "epoch": 0.49, "learning_rate": 0.0022722910333391956, "loss": 0.1179, "step": 19310 }, { "epoch": 0.49, "learning_rate": 0.0022719141773233174, "loss": 0.1218, "step": 19320 }, { "epoch": 0.49, "learning_rate": 0.002271537321307439, "loss": 0.1203, "step": 19330 }, { "epoch": 0.49, "learning_rate": 0.002271160465291561, "loss": 0.1147, "step": 19340 }, { "epoch": 0.49, "learning_rate": 0.002270783609275683, "loss": 0.1206, "step": 19350 }, { "epoch": 0.49, "learning_rate": 0.0022704067532598043, "loss": 0.1198, "step": 19360 }, { "epoch": 0.49, "learning_rate": 0.0022700298972439265, "loss": 0.1178, "step": 19370 }, { "epoch": 0.49, "learning_rate": 0.0022696530412280483, "loss": 0.1152, "step": 19380 }, { "epoch": 0.49, "learning_rate": 0.00226927618521217, "loss": 0.1182, "step": 19390 }, { "epoch": 0.49, "learning_rate": 0.0022688993291962918, "loss": 0.1174, "step": 19400 }, { "epoch": 0.49, "learning_rate": 0.0022685224731804135, "loss": 0.1188, "step": 19410 }, { "epoch": 0.49, "learning_rate": 0.0022681456171645357, "loss": 0.1168, "step": 19420 }, { "epoch": 0.49, "learning_rate": 0.002267768761148657, "loss": 0.1203, "step": 19430 }, { "epoch": 0.49, "learning_rate": 0.0022673919051327787, "loss": 0.1236, "step": 19440 }, { "epoch": 0.49, "learning_rate": 0.002267015049116901, "loss": 0.1227, "step": 19450 }, { "epoch": 0.49, "learning_rate": 0.0022666381931010227, "loss": 0.1164, "step": 19460 }, { "epoch": 0.49, "learning_rate": 0.0022662613370851444, "loss": 0.117, "step": 19470 }, { "epoch": 0.49, "learning_rate": 0.002265884481069266, "loss": 0.117, "step": 19480 }, { "epoch": 0.49, "learning_rate": 0.002265507625053388, "loss": 0.1143, "step": 19490 }, { "epoch": 0.49, "learning_rate": 0.00226513076903751, "loss": 0.1196, "step": 19500 }, { "epoch": 0.49, "eval_cer": 0.6669568485572955, "eval_loss": 0.09227263927459717, "eval_runtime": 90.7185, "eval_samples_per_second": 110.22, "eval_steps_per_second": 6.889, "step": 19500 }, { "epoch": 0.49, "learning_rate": 0.0022647539130216314, "loss": 0.1182, "step": 19510 }, { "epoch": 0.49, "learning_rate": 0.0022643770570057536, "loss": 0.1229, "step": 19520 }, { "epoch": 0.49, "learning_rate": 0.0022640002009898753, "loss": 0.119, "step": 19530 }, { "epoch": 0.49, "learning_rate": 0.002263623344973997, "loss": 0.1206, "step": 19540 }, { "epoch": 0.49, "learning_rate": 0.002263246488958119, "loss": 0.1215, "step": 19550 }, { "epoch": 0.49, "learning_rate": 0.0022628696329422405, "loss": 0.1164, "step": 19560 }, { "epoch": 0.49, "learning_rate": 0.0022624927769263623, "loss": 0.1196, "step": 19570 }, { "epoch": 0.49, "learning_rate": 0.002262115920910484, "loss": 0.1197, "step": 19580 }, { "epoch": 0.49, "learning_rate": 0.0022617390648946058, "loss": 0.1172, "step": 19590 }, { "epoch": 0.49, "learning_rate": 0.002261362208878728, "loss": 0.12, "step": 19600 }, { "epoch": 0.49, "learning_rate": 0.0022609853528628497, "loss": 0.1218, "step": 19610 }, { "epoch": 0.49, "learning_rate": 0.0022606084968469714, "loss": 0.1144, "step": 19620 }, { "epoch": 0.49, "learning_rate": 0.002260231640831093, "loss": 0.1146, "step": 19630 }, { "epoch": 0.49, "learning_rate": 0.002259854784815215, "loss": 0.1174, "step": 19640 }, { "epoch": 0.49, "learning_rate": 0.002259477928799337, "loss": 0.1192, "step": 19650 }, { "epoch": 0.49, "learning_rate": 0.0022591010727834584, "loss": 0.1187, "step": 19660 }, { "epoch": 0.49, "learning_rate": 0.00225872421676758, "loss": 0.1168, "step": 19670 }, { "epoch": 0.49, "learning_rate": 0.0022583473607517023, "loss": 0.1135, "step": 19680 }, { "epoch": 0.49, "learning_rate": 0.002257970504735824, "loss": 0.1226, "step": 19690 }, { "epoch": 0.49, "learning_rate": 0.002257593648719946, "loss": 0.1168, "step": 19700 }, { "epoch": 0.5, "learning_rate": 0.0022572167927040676, "loss": 0.1186, "step": 19710 }, { "epoch": 0.5, "learning_rate": 0.0022568399366881893, "loss": 0.1157, "step": 19720 }, { "epoch": 0.5, "learning_rate": 0.0022564630806723115, "loss": 0.12, "step": 19730 }, { "epoch": 0.5, "learning_rate": 0.002256086224656433, "loss": 0.1199, "step": 19740 }, { "epoch": 0.5, "learning_rate": 0.0022557093686405546, "loss": 0.1184, "step": 19750 }, { "epoch": 0.5, "learning_rate": 0.0022553325126246767, "loss": 0.1196, "step": 19760 }, { "epoch": 0.5, "learning_rate": 0.0022549556566087985, "loss": 0.1181, "step": 19770 }, { "epoch": 0.5, "learning_rate": 0.0022545788005929202, "loss": 0.12, "step": 19780 }, { "epoch": 0.5, "learning_rate": 0.002254201944577042, "loss": 0.1205, "step": 19790 }, { "epoch": 0.5, "learning_rate": 0.0022538250885611637, "loss": 0.1222, "step": 19800 }, { "epoch": 0.5, "learning_rate": 0.0022534482325452855, "loss": 0.1145, "step": 19810 }, { "epoch": 0.5, "learning_rate": 0.002253071376529407, "loss": 0.1165, "step": 19820 }, { "epoch": 0.5, "learning_rate": 0.0022526945205135294, "loss": 0.1159, "step": 19830 }, { "epoch": 0.5, "learning_rate": 0.002252317664497651, "loss": 0.1232, "step": 19840 }, { "epoch": 0.5, "learning_rate": 0.0022519408084817724, "loss": 0.1218, "step": 19850 }, { "epoch": 0.5, "learning_rate": 0.0022515639524658946, "loss": 0.1184, "step": 19860 }, { "epoch": 0.5, "learning_rate": 0.0022511870964500164, "loss": 0.122, "step": 19870 }, { "epoch": 0.5, "learning_rate": 0.002250810240434138, "loss": 0.1124, "step": 19880 }, { "epoch": 0.5, "learning_rate": 0.00225043338441826, "loss": 0.1178, "step": 19890 }, { "epoch": 0.5, "learning_rate": 0.0022500565284023816, "loss": 0.1173, "step": 19900 }, { "epoch": 0.5, "learning_rate": 0.0022496796723865038, "loss": 0.1223, "step": 19910 }, { "epoch": 0.5, "learning_rate": 0.0022493028163706255, "loss": 0.1175, "step": 19920 }, { "epoch": 0.5, "learning_rate": 0.0022489259603547473, "loss": 0.1188, "step": 19930 }, { "epoch": 0.5, "learning_rate": 0.002248549104338869, "loss": 0.1198, "step": 19940 }, { "epoch": 0.5, "learning_rate": 0.0022481722483229907, "loss": 0.1179, "step": 19950 }, { "epoch": 0.5, "learning_rate": 0.002247795392307113, "loss": 0.1201, "step": 19960 }, { "epoch": 0.5, "learning_rate": 0.0022474185362912342, "loss": 0.1225, "step": 19970 }, { "epoch": 0.5, "learning_rate": 0.002247041680275356, "loss": 0.1212, "step": 19980 }, { "epoch": 0.5, "learning_rate": 0.002246664824259478, "loss": 0.1194, "step": 19990 }, { "epoch": 0.5, "learning_rate": 0.0022462879682436, "loss": 0.1192, "step": 20000 }, { "epoch": 0.5, "eval_cer": 0.6664963111288845, "eval_loss": 0.092043936252594, "eval_runtime": 90.451, "eval_samples_per_second": 110.546, "eval_steps_per_second": 6.91, "step": 20000 }, { "epoch": 0.5, "learning_rate": 0.0022459111122277216, "loss": 0.1115, "step": 20010 }, { "epoch": 0.5, "learning_rate": 0.0022455342562118434, "loss": 0.1164, "step": 20020 }, { "epoch": 0.5, "learning_rate": 0.002245157400195965, "loss": 0.1172, "step": 20030 }, { "epoch": 0.5, "learning_rate": 0.002244780544180087, "loss": 0.1178, "step": 20040 }, { "epoch": 0.5, "learning_rate": 0.0022444036881642086, "loss": 0.1159, "step": 20050 }, { "epoch": 0.5, "learning_rate": 0.0022440268321483304, "loss": 0.1169, "step": 20060 }, { "epoch": 0.5, "learning_rate": 0.0022436499761324525, "loss": 0.1225, "step": 20070 }, { "epoch": 0.5, "learning_rate": 0.002243273120116574, "loss": 0.1197, "step": 20080 }, { "epoch": 0.5, "learning_rate": 0.002242896264100696, "loss": 0.1165, "step": 20090 }, { "epoch": 0.5, "learning_rate": 0.002242519408084818, "loss": 0.1179, "step": 20100 }, { "epoch": 0.51, "learning_rate": 0.0022421425520689395, "loss": 0.1151, "step": 20110 }, { "epoch": 0.51, "learning_rate": 0.0022417656960530613, "loss": 0.1182, "step": 20120 }, { "epoch": 0.51, "learning_rate": 0.002241388840037183, "loss": 0.1153, "step": 20130 }, { "epoch": 0.51, "learning_rate": 0.002241011984021305, "loss": 0.1169, "step": 20140 }, { "epoch": 0.51, "learning_rate": 0.002240635128005427, "loss": 0.1147, "step": 20150 }, { "epoch": 0.51, "learning_rate": 0.0022402582719895483, "loss": 0.1198, "step": 20160 }, { "epoch": 0.51, "learning_rate": 0.0022398814159736704, "loss": 0.1145, "step": 20170 }, { "epoch": 0.51, "learning_rate": 0.002239504559957792, "loss": 0.1199, "step": 20180 }, { "epoch": 0.51, "learning_rate": 0.002239127703941914, "loss": 0.1185, "step": 20190 }, { "epoch": 0.51, "learning_rate": 0.0022387508479260357, "loss": 0.1161, "step": 20200 }, { "epoch": 0.51, "learning_rate": 0.0022383739919101574, "loss": 0.1151, "step": 20210 }, { "epoch": 0.51, "learning_rate": 0.0022379971358942796, "loss": 0.1166, "step": 20220 }, { "epoch": 0.51, "learning_rate": 0.0022376202798784013, "loss": 0.1154, "step": 20230 }, { "epoch": 0.51, "learning_rate": 0.002237243423862523, "loss": 0.113, "step": 20240 }, { "epoch": 0.51, "learning_rate": 0.002236866567846645, "loss": 0.117, "step": 20250 }, { "epoch": 0.51, "learning_rate": 0.0022364897118307666, "loss": 0.1133, "step": 20260 }, { "epoch": 0.51, "learning_rate": 0.0022361128558148883, "loss": 0.1151, "step": 20270 }, { "epoch": 0.51, "learning_rate": 0.00223573599979901, "loss": 0.1179, "step": 20280 }, { "epoch": 0.51, "learning_rate": 0.002235359143783132, "loss": 0.1155, "step": 20290 }, { "epoch": 0.51, "learning_rate": 0.002234982287767254, "loss": 0.1183, "step": 20300 }, { "epoch": 0.51, "learning_rate": 0.0022346054317513753, "loss": 0.1147, "step": 20310 }, { "epoch": 0.51, "learning_rate": 0.0022342285757354975, "loss": 0.1121, "step": 20320 }, { "epoch": 0.51, "learning_rate": 0.002233851719719619, "loss": 0.1151, "step": 20330 }, { "epoch": 0.51, "learning_rate": 0.002233474863703741, "loss": 0.1132, "step": 20340 }, { "epoch": 0.51, "learning_rate": 0.0022330980076878627, "loss": 0.112, "step": 20350 }, { "epoch": 0.51, "learning_rate": 0.0022327211516719844, "loss": 0.117, "step": 20360 }, { "epoch": 0.51, "learning_rate": 0.0022323442956561066, "loss": 0.1193, "step": 20370 }, { "epoch": 0.51, "learning_rate": 0.0022319674396402284, "loss": 0.1169, "step": 20380 }, { "epoch": 0.51, "learning_rate": 0.0022315905836243497, "loss": 0.1149, "step": 20390 }, { "epoch": 0.51, "learning_rate": 0.002231213727608472, "loss": 0.117, "step": 20400 }, { "epoch": 0.51, "learning_rate": 0.0022308368715925936, "loss": 0.1156, "step": 20410 }, { "epoch": 0.51, "learning_rate": 0.0022304600155767153, "loss": 0.1151, "step": 20420 }, { "epoch": 0.51, "learning_rate": 0.002230083159560837, "loss": 0.1175, "step": 20430 }, { "epoch": 0.51, "learning_rate": 0.002229706303544959, "loss": 0.1186, "step": 20440 }, { "epoch": 0.51, "learning_rate": 0.002229329447529081, "loss": 0.1189, "step": 20450 }, { "epoch": 0.51, "learning_rate": 0.0022289525915132028, "loss": 0.1145, "step": 20460 }, { "epoch": 0.51, "learning_rate": 0.002228575735497324, "loss": 0.1116, "step": 20470 }, { "epoch": 0.51, "learning_rate": 0.0022281988794814462, "loss": 0.1133, "step": 20480 }, { "epoch": 0.51, "learning_rate": 0.002227822023465568, "loss": 0.1166, "step": 20490 }, { "epoch": 0.52, "learning_rate": 0.0022274451674496897, "loss": 0.1171, "step": 20500 }, { "epoch": 0.52, "eval_cer": 0.6664255702699751, "eval_loss": 0.09097065031528473, "eval_runtime": 90.5473, "eval_samples_per_second": 110.428, "eval_steps_per_second": 6.902, "step": 20500 }, { "epoch": 0.52, "learning_rate": 0.0022270683114338115, "loss": 0.1169, "step": 20510 }, { "epoch": 0.52, "learning_rate": 0.0022266914554179332, "loss": 0.1147, "step": 20520 }, { "epoch": 0.52, "learning_rate": 0.0022263145994020554, "loss": 0.1185, "step": 20530 }, { "epoch": 0.52, "learning_rate": 0.0022259377433861767, "loss": 0.1151, "step": 20540 }, { "epoch": 0.52, "learning_rate": 0.002225560887370299, "loss": 0.1262, "step": 20550 }, { "epoch": 0.52, "learning_rate": 0.0022251840313544206, "loss": 0.1153, "step": 20560 }, { "epoch": 0.52, "learning_rate": 0.0022248071753385424, "loss": 0.1152, "step": 20570 }, { "epoch": 0.52, "learning_rate": 0.002224430319322664, "loss": 0.116, "step": 20580 }, { "epoch": 0.52, "learning_rate": 0.002224053463306786, "loss": 0.1174, "step": 20590 }, { "epoch": 0.52, "learning_rate": 0.0022236766072909076, "loss": 0.1168, "step": 20600 }, { "epoch": 0.52, "learning_rate": 0.00222329975127503, "loss": 0.1212, "step": 20610 }, { "epoch": 0.52, "learning_rate": 0.002222922895259151, "loss": 0.1179, "step": 20620 }, { "epoch": 0.52, "learning_rate": 0.0022225460392432733, "loss": 0.1173, "step": 20630 }, { "epoch": 0.52, "learning_rate": 0.002222169183227395, "loss": 0.1177, "step": 20640 }, { "epoch": 0.52, "learning_rate": 0.0022217923272115168, "loss": 0.1143, "step": 20650 }, { "epoch": 0.52, "learning_rate": 0.0022214154711956385, "loss": 0.1165, "step": 20660 }, { "epoch": 0.52, "learning_rate": 0.0022210386151797603, "loss": 0.1171, "step": 20670 }, { "epoch": 0.52, "learning_rate": 0.0022206617591638824, "loss": 0.1179, "step": 20680 }, { "epoch": 0.52, "learning_rate": 0.002220284903148004, "loss": 0.1132, "step": 20690 }, { "epoch": 0.52, "learning_rate": 0.0022199080471321255, "loss": 0.1157, "step": 20700 }, { "epoch": 0.52, "learning_rate": 0.0022195311911162477, "loss": 0.1183, "step": 20710 }, { "epoch": 0.52, "learning_rate": 0.0022191543351003694, "loss": 0.1109, "step": 20720 }, { "epoch": 0.52, "learning_rate": 0.002218777479084491, "loss": 0.1149, "step": 20730 }, { "epoch": 0.52, "learning_rate": 0.002218400623068613, "loss": 0.1176, "step": 20740 }, { "epoch": 0.52, "learning_rate": 0.0022180237670527347, "loss": 0.1171, "step": 20750 }, { "epoch": 0.52, "learning_rate": 0.002217646911036857, "loss": 0.1141, "step": 20760 }, { "epoch": 0.52, "learning_rate": 0.002217270055020978, "loss": 0.1177, "step": 20770 }, { "epoch": 0.52, "learning_rate": 0.0022168931990051003, "loss": 0.1168, "step": 20780 }, { "epoch": 0.52, "learning_rate": 0.002216516342989222, "loss": 0.1154, "step": 20790 }, { "epoch": 0.52, "learning_rate": 0.002216139486973344, "loss": 0.117, "step": 20800 }, { "epoch": 0.52, "learning_rate": 0.0022157626309574656, "loss": 0.1117, "step": 20810 }, { "epoch": 0.52, "learning_rate": 0.0022153857749415873, "loss": 0.1193, "step": 20820 }, { "epoch": 0.52, "learning_rate": 0.002215008918925709, "loss": 0.1155, "step": 20830 }, { "epoch": 0.52, "learning_rate": 0.0022146320629098312, "loss": 0.1168, "step": 20840 }, { "epoch": 0.52, "learning_rate": 0.0022142552068939525, "loss": 0.1174, "step": 20850 }, { "epoch": 0.52, "learning_rate": 0.0022138783508780747, "loss": 0.1157, "step": 20860 }, { "epoch": 0.52, "learning_rate": 0.0022135014948621965, "loss": 0.1179, "step": 20870 }, { "epoch": 0.52, "learning_rate": 0.002213124638846318, "loss": 0.1193, "step": 20880 }, { "epoch": 0.52, "learning_rate": 0.00221274778283044, "loss": 0.1098, "step": 20890 }, { "epoch": 0.53, "learning_rate": 0.0022123709268145617, "loss": 0.1113, "step": 20900 }, { "epoch": 0.53, "learning_rate": 0.0022119940707986834, "loss": 0.1159, "step": 20910 }, { "epoch": 0.53, "learning_rate": 0.002211617214782805, "loss": 0.115, "step": 20920 }, { "epoch": 0.53, "learning_rate": 0.002211240358766927, "loss": 0.1144, "step": 20930 }, { "epoch": 0.53, "learning_rate": 0.002210863502751049, "loss": 0.1148, "step": 20940 }, { "epoch": 0.53, "learning_rate": 0.002210486646735171, "loss": 0.1135, "step": 20950 }, { "epoch": 0.53, "learning_rate": 0.0022101097907192926, "loss": 0.1133, "step": 20960 }, { "epoch": 0.53, "learning_rate": 0.0022097329347034143, "loss": 0.1146, "step": 20970 }, { "epoch": 0.53, "learning_rate": 0.002209356078687536, "loss": 0.1112, "step": 20980 }, { "epoch": 0.53, "learning_rate": 0.0022089792226716583, "loss": 0.1161, "step": 20990 }, { "epoch": 0.53, "learning_rate": 0.0022086023666557796, "loss": 0.1153, "step": 21000 }, { "epoch": 0.53, "eval_cer": 0.6667460696715651, "eval_loss": 0.09056726843118668, "eval_runtime": 90.5012, "eval_samples_per_second": 110.485, "eval_steps_per_second": 6.906, "step": 21000 }, { "epoch": 0.53, "learning_rate": 0.0022082255106399013, "loss": 0.1174, "step": 21010 }, { "epoch": 0.53, "learning_rate": 0.0022078486546240235, "loss": 0.1156, "step": 21020 }, { "epoch": 0.53, "learning_rate": 0.0022074717986081452, "loss": 0.1146, "step": 21030 }, { "epoch": 0.53, "learning_rate": 0.002207094942592267, "loss": 0.1141, "step": 21040 }, { "epoch": 0.53, "learning_rate": 0.0022067180865763887, "loss": 0.1204, "step": 21050 }, { "epoch": 0.53, "learning_rate": 0.0022063412305605105, "loss": 0.1143, "step": 21060 }, { "epoch": 0.53, "learning_rate": 0.0022059643745446327, "loss": 0.1137, "step": 21070 }, { "epoch": 0.53, "learning_rate": 0.002205587518528754, "loss": 0.1142, "step": 21080 }, { "epoch": 0.53, "learning_rate": 0.002205210662512876, "loss": 0.1162, "step": 21090 }, { "epoch": 0.53, "learning_rate": 0.002204833806496998, "loss": 0.1157, "step": 21100 }, { "epoch": 0.53, "learning_rate": 0.0022044569504811196, "loss": 0.1174, "step": 21110 }, { "epoch": 0.53, "learning_rate": 0.0022040800944652414, "loss": 0.1144, "step": 21120 }, { "epoch": 0.53, "learning_rate": 0.002203703238449363, "loss": 0.1112, "step": 21130 }, { "epoch": 0.53, "learning_rate": 0.002203326382433485, "loss": 0.1166, "step": 21140 }, { "epoch": 0.53, "learning_rate": 0.0022029495264176066, "loss": 0.1152, "step": 21150 }, { "epoch": 0.53, "learning_rate": 0.0022025726704017284, "loss": 0.1105, "step": 21160 }, { "epoch": 0.53, "learning_rate": 0.0022021958143858505, "loss": 0.1146, "step": 21170 }, { "epoch": 0.53, "learning_rate": 0.0022018189583699723, "loss": 0.1094, "step": 21180 }, { "epoch": 0.53, "learning_rate": 0.002201442102354094, "loss": 0.1152, "step": 21190 }, { "epoch": 0.53, "learning_rate": 0.0022010652463382158, "loss": 0.1148, "step": 21200 }, { "epoch": 0.53, "learning_rate": 0.0022006883903223375, "loss": 0.1176, "step": 21210 }, { "epoch": 0.53, "learning_rate": 0.0022003115343064597, "loss": 0.115, "step": 21220 }, { "epoch": 0.53, "learning_rate": 0.002199934678290581, "loss": 0.1175, "step": 21230 }, { "epoch": 0.53, "learning_rate": 0.0021995578222747027, "loss": 0.1085, "step": 21240 }, { "epoch": 0.53, "learning_rate": 0.002199180966258825, "loss": 0.119, "step": 21250 }, { "epoch": 0.53, "learning_rate": 0.0021988041102429467, "loss": 0.1126, "step": 21260 }, { "epoch": 0.53, "learning_rate": 0.0021984272542270684, "loss": 0.1117, "step": 21270 }, { "epoch": 0.53, "learning_rate": 0.00219805039821119, "loss": 0.1146, "step": 21280 }, { "epoch": 0.53, "learning_rate": 0.002197673542195312, "loss": 0.1172, "step": 21290 }, { "epoch": 0.54, "learning_rate": 0.002197296686179434, "loss": 0.1111, "step": 21300 }, { "epoch": 0.54, "learning_rate": 0.0021969198301635554, "loss": 0.113, "step": 21310 }, { "epoch": 0.54, "learning_rate": 0.002196542974147677, "loss": 0.1072, "step": 21320 }, { "epoch": 0.54, "learning_rate": 0.0021961661181317993, "loss": 0.1112, "step": 21330 }, { "epoch": 0.54, "learning_rate": 0.002195789262115921, "loss": 0.1138, "step": 21340 }, { "epoch": 0.54, "learning_rate": 0.002195412406100043, "loss": 0.1179, "step": 21350 }, { "epoch": 0.54, "learning_rate": 0.0021950355500841645, "loss": 0.1125, "step": 21360 }, { "epoch": 0.54, "learning_rate": 0.0021946586940682863, "loss": 0.116, "step": 21370 }, { "epoch": 0.54, "learning_rate": 0.002194281838052408, "loss": 0.1137, "step": 21380 }, { "epoch": 0.54, "learning_rate": 0.0021939049820365298, "loss": 0.1113, "step": 21390 }, { "epoch": 0.54, "learning_rate": 0.002193528126020652, "loss": 0.1131, "step": 21400 }, { "epoch": 0.54, "learning_rate": 0.0021931512700047737, "loss": 0.1159, "step": 21410 }, { "epoch": 0.54, "learning_rate": 0.002192774413988895, "loss": 0.1164, "step": 21420 }, { "epoch": 0.54, "learning_rate": 0.002192397557973017, "loss": 0.1153, "step": 21430 }, { "epoch": 0.54, "learning_rate": 0.002192020701957139, "loss": 0.1154, "step": 21440 }, { "epoch": 0.54, "learning_rate": 0.0021916438459412607, "loss": 0.1124, "step": 21450 }, { "epoch": 0.54, "learning_rate": 0.0021912669899253824, "loss": 0.1153, "step": 21460 }, { "epoch": 0.54, "learning_rate": 0.002190890133909504, "loss": 0.116, "step": 21470 }, { "epoch": 0.54, "learning_rate": 0.0021905132778936263, "loss": 0.1127, "step": 21480 }, { "epoch": 0.54, "learning_rate": 0.002190136421877748, "loss": 0.1138, "step": 21490 }, { "epoch": 0.54, "learning_rate": 0.00218975956586187, "loss": 0.1102, "step": 21500 }, { "epoch": 0.54, "eval_cer": 0.6668567526480902, "eval_loss": 0.08902458846569061, "eval_runtime": 90.6566, "eval_samples_per_second": 110.295, "eval_steps_per_second": 6.894, "step": 21500 }, { "epoch": 0.54, "learning_rate": 0.0021893827098459916, "loss": 0.1131, "step": 21510 }, { "epoch": 0.54, "learning_rate": 0.0021890058538301133, "loss": 0.1157, "step": 21520 }, { "epoch": 0.54, "learning_rate": 0.0021886289978142355, "loss": 0.1149, "step": 21530 }, { "epoch": 0.54, "learning_rate": 0.002188252141798357, "loss": 0.1186, "step": 21540 }, { "epoch": 0.54, "learning_rate": 0.0021878752857824786, "loss": 0.1136, "step": 21550 }, { "epoch": 0.54, "learning_rate": 0.0021874984297666007, "loss": 0.1118, "step": 21560 }, { "epoch": 0.54, "learning_rate": 0.0021871215737507225, "loss": 0.1162, "step": 21570 }, { "epoch": 0.54, "learning_rate": 0.0021867447177348442, "loss": 0.1141, "step": 21580 }, { "epoch": 0.54, "learning_rate": 0.002186367861718966, "loss": 0.1146, "step": 21590 }, { "epoch": 0.54, "learning_rate": 0.0021859910057030877, "loss": 0.1196, "step": 21600 }, { "epoch": 0.54, "learning_rate": 0.0021856141496872095, "loss": 0.114, "step": 21610 }, { "epoch": 0.54, "learning_rate": 0.002185237293671331, "loss": 0.1138, "step": 21620 }, { "epoch": 0.54, "learning_rate": 0.0021848604376554534, "loss": 0.1109, "step": 21630 }, { "epoch": 0.54, "learning_rate": 0.002184483581639575, "loss": 0.109, "step": 21640 }, { "epoch": 0.54, "learning_rate": 0.0021841067256236964, "loss": 0.1119, "step": 21650 }, { "epoch": 0.54, "learning_rate": 0.0021837298696078186, "loss": 0.1158, "step": 21660 }, { "epoch": 0.54, "learning_rate": 0.0021833530135919404, "loss": 0.1173, "step": 21670 }, { "epoch": 0.54, "learning_rate": 0.002182976157576062, "loss": 0.1134, "step": 21680 }, { "epoch": 0.54, "learning_rate": 0.002182599301560184, "loss": 0.114, "step": 21690 }, { "epoch": 0.55, "learning_rate": 0.0021822224455443056, "loss": 0.1112, "step": 21700 }, { "epoch": 0.55, "learning_rate": 0.0021818455895284278, "loss": 0.1179, "step": 21710 }, { "epoch": 0.55, "learning_rate": 0.0021814687335125495, "loss": 0.1152, "step": 21720 }, { "epoch": 0.55, "learning_rate": 0.002181091877496671, "loss": 0.1151, "step": 21730 }, { "epoch": 0.55, "learning_rate": 0.002180715021480793, "loss": 0.1141, "step": 21740 }, { "epoch": 0.55, "learning_rate": 0.0021803381654649148, "loss": 0.109, "step": 21750 }, { "epoch": 0.55, "learning_rate": 0.0021799613094490365, "loss": 0.1111, "step": 21760 }, { "epoch": 0.55, "learning_rate": 0.0021795844534331582, "loss": 0.1145, "step": 21770 }, { "epoch": 0.55, "learning_rate": 0.00217920759741728, "loss": 0.1118, "step": 21780 }, { "epoch": 0.55, "learning_rate": 0.002178830741401402, "loss": 0.1116, "step": 21790 }, { "epoch": 0.55, "learning_rate": 0.002178453885385524, "loss": 0.1155, "step": 21800 }, { "epoch": 0.55, "learning_rate": 0.0021780770293696457, "loss": 0.1132, "step": 21810 }, { "epoch": 0.55, "learning_rate": 0.0021777001733537674, "loss": 0.1149, "step": 21820 }, { "epoch": 0.55, "learning_rate": 0.002177323317337889, "loss": 0.1104, "step": 21830 }, { "epoch": 0.55, "learning_rate": 0.002176946461322011, "loss": 0.1162, "step": 21840 }, { "epoch": 0.55, "learning_rate": 0.0021765696053061326, "loss": 0.1115, "step": 21850 }, { "epoch": 0.55, "learning_rate": 0.0021761927492902544, "loss": 0.1138, "step": 21860 }, { "epoch": 0.55, "learning_rate": 0.0021758158932743766, "loss": 0.1107, "step": 21870 }, { "epoch": 0.55, "learning_rate": 0.002175439037258498, "loss": 0.1108, "step": 21880 }, { "epoch": 0.55, "learning_rate": 0.00217506218124262, "loss": 0.1127, "step": 21890 }, { "epoch": 0.55, "learning_rate": 0.002174685325226742, "loss": 0.1157, "step": 21900 }, { "epoch": 0.55, "learning_rate": 0.0021743084692108635, "loss": 0.1102, "step": 21910 }, { "epoch": 0.55, "learning_rate": 0.0021739316131949853, "loss": 0.1119, "step": 21920 }, { "epoch": 0.55, "learning_rate": 0.002173554757179107, "loss": 0.1193, "step": 21930 }, { "epoch": 0.55, "learning_rate": 0.002173177901163229, "loss": 0.1146, "step": 21940 }, { "epoch": 0.55, "learning_rate": 0.002172801045147351, "loss": 0.1112, "step": 21950 }, { "epoch": 0.55, "learning_rate": 0.0021724241891314723, "loss": 0.1088, "step": 21960 }, { "epoch": 0.55, "learning_rate": 0.0021720473331155944, "loss": 0.1114, "step": 21970 }, { "epoch": 0.55, "learning_rate": 0.002171670477099716, "loss": 0.1147, "step": 21980 }, { "epoch": 0.55, "learning_rate": 0.002171293621083838, "loss": 0.1102, "step": 21990 }, { "epoch": 0.55, "learning_rate": 0.0021709167650679597, "loss": 0.1147, "step": 22000 }, { "epoch": 0.55, "eval_cer": 0.666688322031639, "eval_loss": 0.08858127146959305, "eval_runtime": 90.7851, "eval_samples_per_second": 110.139, "eval_steps_per_second": 6.884, "step": 22000 }, { "epoch": 0.55, "learning_rate": 0.0021705399090520814, "loss": 0.1154, "step": 22010 }, { "epoch": 0.55, "learning_rate": 0.0021701630530362036, "loss": 0.1173, "step": 22020 }, { "epoch": 0.55, "learning_rate": 0.002169786197020325, "loss": 0.1106, "step": 22030 }, { "epoch": 0.55, "learning_rate": 0.002169409341004447, "loss": 0.1111, "step": 22040 }, { "epoch": 0.55, "learning_rate": 0.002169032484988569, "loss": 0.1086, "step": 22050 }, { "epoch": 0.55, "learning_rate": 0.0021686556289726906, "loss": 0.1112, "step": 22060 }, { "epoch": 0.55, "learning_rate": 0.0021682787729568123, "loss": 0.1127, "step": 22070 }, { "epoch": 0.55, "learning_rate": 0.002167901916940934, "loss": 0.1103, "step": 22080 }, { "epoch": 0.55, "learning_rate": 0.002167525060925056, "loss": 0.1123, "step": 22090 }, { "epoch": 0.56, "learning_rate": 0.002167148204909178, "loss": 0.1105, "step": 22100 }, { "epoch": 0.56, "learning_rate": 0.0021667713488932993, "loss": 0.1101, "step": 22110 }, { "epoch": 0.56, "learning_rate": 0.0021663944928774215, "loss": 0.1088, "step": 22120 }, { "epoch": 0.56, "learning_rate": 0.0021660176368615432, "loss": 0.1128, "step": 22130 }, { "epoch": 0.56, "learning_rate": 0.002165640780845665, "loss": 0.1125, "step": 22140 }, { "epoch": 0.56, "learning_rate": 0.0021652639248297867, "loss": 0.1112, "step": 22150 }, { "epoch": 0.56, "learning_rate": 0.0021648870688139085, "loss": 0.1094, "step": 22160 }, { "epoch": 0.56, "learning_rate": 0.00216451021279803, "loss": 0.1132, "step": 22170 }, { "epoch": 0.56, "learning_rate": 0.0021641333567821524, "loss": 0.1107, "step": 22180 }, { "epoch": 0.56, "learning_rate": 0.0021637565007662737, "loss": 0.1138, "step": 22190 }, { "epoch": 0.56, "learning_rate": 0.002163379644750396, "loss": 0.1144, "step": 22200 }, { "epoch": 0.56, "learning_rate": 0.0021630027887345176, "loss": 0.1129, "step": 22210 }, { "epoch": 0.56, "learning_rate": 0.0021626259327186394, "loss": 0.1146, "step": 22220 }, { "epoch": 0.56, "learning_rate": 0.002162249076702761, "loss": 0.1131, "step": 22230 }, { "epoch": 0.56, "learning_rate": 0.002161872220686883, "loss": 0.1155, "step": 22240 }, { "epoch": 0.56, "learning_rate": 0.002161495364671005, "loss": 0.108, "step": 22250 }, { "epoch": 0.56, "learning_rate": 0.0021611185086551263, "loss": 0.1088, "step": 22260 }, { "epoch": 0.56, "learning_rate": 0.002160741652639248, "loss": 0.1103, "step": 22270 }, { "epoch": 0.56, "learning_rate": 0.0021603647966233703, "loss": 0.1099, "step": 22280 }, { "epoch": 0.56, "learning_rate": 0.002159987940607492, "loss": 0.1122, "step": 22290 }, { "epoch": 0.56, "learning_rate": 0.0021596110845916137, "loss": 0.1144, "step": 22300 }, { "epoch": 0.56, "learning_rate": 0.0021592342285757355, "loss": 0.1127, "step": 22310 }, { "epoch": 0.56, "learning_rate": 0.0021588573725598572, "loss": 0.1123, "step": 22320 }, { "epoch": 0.56, "learning_rate": 0.0021584805165439794, "loss": 0.1154, "step": 22330 }, { "epoch": 0.56, "learning_rate": 0.0021581036605281007, "loss": 0.1109, "step": 22340 }, { "epoch": 0.56, "learning_rate": 0.002157726804512223, "loss": 0.1111, "step": 22350 }, { "epoch": 0.56, "learning_rate": 0.0021573499484963446, "loss": 0.1085, "step": 22360 }, { "epoch": 0.56, "learning_rate": 0.0021569730924804664, "loss": 0.1093, "step": 22370 }, { "epoch": 0.56, "learning_rate": 0.002156596236464588, "loss": 0.1126, "step": 22380 }, { "epoch": 0.56, "learning_rate": 0.00215621938044871, "loss": 0.1108, "step": 22390 }, { "epoch": 0.56, "learning_rate": 0.0021558425244328316, "loss": 0.1084, "step": 22400 }, { "epoch": 0.56, "learning_rate": 0.002155465668416954, "loss": 0.1128, "step": 22410 }, { "epoch": 0.56, "learning_rate": 0.002155088812401075, "loss": 0.1128, "step": 22420 }, { "epoch": 0.56, "learning_rate": 0.0021547119563851973, "loss": 0.112, "step": 22430 }, { "epoch": 0.56, "learning_rate": 0.002154335100369319, "loss": 0.1103, "step": 22440 }, { "epoch": 0.56, "learning_rate": 0.0021539582443534408, "loss": 0.1099, "step": 22450 }, { "epoch": 0.56, "learning_rate": 0.0021535813883375625, "loss": 0.11, "step": 22460 }, { "epoch": 0.56, "learning_rate": 0.0021532045323216843, "loss": 0.1126, "step": 22470 }, { "epoch": 0.56, "learning_rate": 0.002152827676305806, "loss": 0.1111, "step": 22480 }, { "epoch": 0.57, "learning_rate": 0.0021524508202899278, "loss": 0.1072, "step": 22490 }, { "epoch": 0.57, "learning_rate": 0.0021520739642740495, "loss": 0.1144, "step": 22500 }, { "epoch": 0.57, "eval_cer": 0.6664390447192912, "eval_loss": 0.08680952340364456, "eval_runtime": 90.6322, "eval_samples_per_second": 110.325, "eval_steps_per_second": 6.896, "step": 22500 }, { "epoch": 0.57, "learning_rate": 0.0021516971082581717, "loss": 0.1108, "step": 22510 }, { "epoch": 0.57, "learning_rate": 0.0021513202522422934, "loss": 0.1112, "step": 22520 }, { "epoch": 0.57, "learning_rate": 0.002150943396226415, "loss": 0.11, "step": 22530 }, { "epoch": 0.57, "learning_rate": 0.002150566540210537, "loss": 0.1124, "step": 22540 }, { "epoch": 0.57, "learning_rate": 0.0021501896841946587, "loss": 0.1131, "step": 22550 }, { "epoch": 0.57, "learning_rate": 0.002149812828178781, "loss": 0.1093, "step": 22560 }, { "epoch": 0.57, "learning_rate": 0.002149435972162902, "loss": 0.1166, "step": 22570 }, { "epoch": 0.57, "learning_rate": 0.002149059116147024, "loss": 0.1096, "step": 22580 }, { "epoch": 0.57, "learning_rate": 0.002148682260131146, "loss": 0.1121, "step": 22590 }, { "epoch": 0.57, "learning_rate": 0.002148305404115268, "loss": 0.1122, "step": 22600 }, { "epoch": 0.57, "learning_rate": 0.0021479285480993896, "loss": 0.1071, "step": 22610 }, { "epoch": 0.57, "learning_rate": 0.0021475516920835113, "loss": 0.1089, "step": 22620 }, { "epoch": 0.57, "learning_rate": 0.002147174836067633, "loss": 0.1123, "step": 22630 }, { "epoch": 0.57, "learning_rate": 0.0021467979800517552, "loss": 0.1092, "step": 22640 }, { "epoch": 0.57, "learning_rate": 0.0021464211240358765, "loss": 0.1076, "step": 22650 }, { "epoch": 0.57, "learning_rate": 0.0021460442680199987, "loss": 0.1095, "step": 22660 }, { "epoch": 0.57, "learning_rate": 0.0021456674120041205, "loss": 0.1107, "step": 22670 }, { "epoch": 0.57, "learning_rate": 0.002145290555988242, "loss": 0.1099, "step": 22680 }, { "epoch": 0.57, "learning_rate": 0.002144913699972364, "loss": 0.1103, "step": 22690 }, { "epoch": 0.57, "learning_rate": 0.0021445368439564857, "loss": 0.1155, "step": 22700 }, { "epoch": 0.57, "learning_rate": 0.0021441599879406074, "loss": 0.1082, "step": 22710 }, { "epoch": 0.57, "learning_rate": 0.002143783131924729, "loss": 0.1117, "step": 22720 }, { "epoch": 0.57, "learning_rate": 0.002143406275908851, "loss": 0.1089, "step": 22730 }, { "epoch": 0.57, "learning_rate": 0.002143029419892973, "loss": 0.1121, "step": 22740 }, { "epoch": 0.57, "learning_rate": 0.002142652563877095, "loss": 0.1062, "step": 22750 }, { "epoch": 0.57, "learning_rate": 0.0021422757078612166, "loss": 0.1118, "step": 22760 }, { "epoch": 0.57, "learning_rate": 0.0021418988518453383, "loss": 0.1112, "step": 22770 }, { "epoch": 0.57, "learning_rate": 0.00214152199582946, "loss": 0.1119, "step": 22780 }, { "epoch": 0.57, "learning_rate": 0.0021411451398135823, "loss": 0.1151, "step": 22790 }, { "epoch": 0.57, "learning_rate": 0.0021407682837977036, "loss": 0.1126, "step": 22800 }, { "epoch": 0.57, "learning_rate": 0.0021403914277818253, "loss": 0.1119, "step": 22810 }, { "epoch": 0.57, "learning_rate": 0.0021400145717659475, "loss": 0.1179, "step": 22820 }, { "epoch": 0.57, "learning_rate": 0.0021396377157500692, "loss": 0.1097, "step": 22830 }, { "epoch": 0.57, "learning_rate": 0.002139260859734191, "loss": 0.111, "step": 22840 }, { "epoch": 0.57, "learning_rate": 0.0021388840037183127, "loss": 0.1081, "step": 22850 }, { "epoch": 0.57, "learning_rate": 0.0021385071477024345, "loss": 0.1145, "step": 22860 }, { "epoch": 0.57, "learning_rate": 0.0021381302916865567, "loss": 0.1128, "step": 22870 }, { "epoch": 0.57, "learning_rate": 0.002137753435670678, "loss": 0.1095, "step": 22880 }, { "epoch": 0.58, "learning_rate": 0.0021373765796547997, "loss": 0.1125, "step": 22890 }, { "epoch": 0.58, "learning_rate": 0.002136999723638922, "loss": 0.1108, "step": 22900 }, { "epoch": 0.58, "learning_rate": 0.0021366228676230436, "loss": 0.1148, "step": 22910 }, { "epoch": 0.58, "learning_rate": 0.0021362460116071654, "loss": 0.1093, "step": 22920 }, { "epoch": 0.58, "learning_rate": 0.002135869155591287, "loss": 0.11, "step": 22930 }, { "epoch": 0.58, "learning_rate": 0.002135492299575409, "loss": 0.1082, "step": 22940 }, { "epoch": 0.58, "learning_rate": 0.0021351154435595306, "loss": 0.1119, "step": 22950 }, { "epoch": 0.58, "learning_rate": 0.0021347385875436524, "loss": 0.1127, "step": 22960 }, { "epoch": 0.58, "learning_rate": 0.0021343617315277745, "loss": 0.1118, "step": 22970 }, { "epoch": 0.58, "learning_rate": 0.0021339848755118963, "loss": 0.1102, "step": 22980 }, { "epoch": 0.58, "learning_rate": 0.0021336080194960176, "loss": 0.111, "step": 22990 }, { "epoch": 0.58, "learning_rate": 0.0021332311634801398, "loss": 0.1132, "step": 23000 }, { "epoch": 0.58, "eval_cer": 0.6665848575101047, "eval_loss": 0.08576372265815735, "eval_runtime": 90.6462, "eval_samples_per_second": 110.308, "eval_steps_per_second": 6.895, "step": 23000 }, { "epoch": 0.58, "learning_rate": 0.0021328543074642615, "loss": 0.1111, "step": 23010 }, { "epoch": 0.58, "learning_rate": 0.0021324774514483833, "loss": 0.109, "step": 23020 }, { "epoch": 0.58, "learning_rate": 0.002132100595432505, "loss": 0.109, "step": 23030 }, { "epoch": 0.58, "learning_rate": 0.0021317237394166267, "loss": 0.1102, "step": 23040 }, { "epoch": 0.58, "learning_rate": 0.002131346883400749, "loss": 0.1135, "step": 23050 }, { "epoch": 0.58, "learning_rate": 0.0021309700273848707, "loss": 0.1128, "step": 23060 }, { "epoch": 0.58, "learning_rate": 0.0021305931713689924, "loss": 0.1107, "step": 23070 }, { "epoch": 0.58, "learning_rate": 0.002130216315353114, "loss": 0.1085, "step": 23080 }, { "epoch": 0.58, "learning_rate": 0.002129839459337236, "loss": 0.1109, "step": 23090 }, { "epoch": 0.58, "learning_rate": 0.002129462603321358, "loss": 0.1117, "step": 23100 }, { "epoch": 0.58, "learning_rate": 0.0021290857473054794, "loss": 0.1074, "step": 23110 }, { "epoch": 0.58, "learning_rate": 0.002128708891289601, "loss": 0.1093, "step": 23120 }, { "epoch": 0.58, "learning_rate": 0.0021283320352737233, "loss": 0.1067, "step": 23130 }, { "epoch": 0.58, "learning_rate": 0.0021279551792578446, "loss": 0.1132, "step": 23140 }, { "epoch": 0.58, "learning_rate": 0.002127578323241967, "loss": 0.1059, "step": 23150 }, { "epoch": 0.58, "learning_rate": 0.0021272014672260886, "loss": 0.1103, "step": 23160 }, { "epoch": 0.58, "learning_rate": 0.0021268246112102103, "loss": 0.1079, "step": 23170 }, { "epoch": 0.58, "learning_rate": 0.002126447755194332, "loss": 0.1082, "step": 23180 }, { "epoch": 0.58, "learning_rate": 0.002126070899178454, "loss": 0.1061, "step": 23190 }, { "epoch": 0.58, "learning_rate": 0.002125694043162576, "loss": 0.1124, "step": 23200 }, { "epoch": 0.58, "learning_rate": 0.0021253171871466977, "loss": 0.1113, "step": 23210 }, { "epoch": 0.58, "learning_rate": 0.002124940331130819, "loss": 0.1055, "step": 23220 }, { "epoch": 0.58, "learning_rate": 0.002124563475114941, "loss": 0.1137, "step": 23230 }, { "epoch": 0.58, "learning_rate": 0.002124186619099063, "loss": 0.112, "step": 23240 }, { "epoch": 0.58, "learning_rate": 0.0021238097630831847, "loss": 0.1043, "step": 23250 }, { "epoch": 0.58, "learning_rate": 0.0021234329070673064, "loss": 0.1094, "step": 23260 }, { "epoch": 0.58, "learning_rate": 0.002123056051051428, "loss": 0.1123, "step": 23270 }, { "epoch": 0.58, "learning_rate": 0.0021226791950355504, "loss": 0.1087, "step": 23280 }, { "epoch": 0.59, "learning_rate": 0.002122302339019672, "loss": 0.1161, "step": 23290 }, { "epoch": 0.59, "learning_rate": 0.0021219254830037934, "loss": 0.1083, "step": 23300 }, { "epoch": 0.59, "learning_rate": 0.0021215486269879156, "loss": 0.1095, "step": 23310 }, { "epoch": 0.59, "learning_rate": 0.0021211717709720373, "loss": 0.1109, "step": 23320 }, { "epoch": 0.59, "learning_rate": 0.002120794914956159, "loss": 0.1116, "step": 23330 }, { "epoch": 0.59, "learning_rate": 0.002120418058940281, "loss": 0.1127, "step": 23340 }, { "epoch": 0.59, "learning_rate": 0.0021200412029244026, "loss": 0.109, "step": 23350 }, { "epoch": 0.59, "learning_rate": 0.0021196643469085247, "loss": 0.1046, "step": 23360 }, { "epoch": 0.59, "learning_rate": 0.002119287490892646, "loss": 0.1071, "step": 23370 }, { "epoch": 0.59, "learning_rate": 0.0021189106348767682, "loss": 0.1146, "step": 23380 }, { "epoch": 0.59, "learning_rate": 0.00211853377886089, "loss": 0.1081, "step": 23390 }, { "epoch": 0.59, "learning_rate": 0.0021181569228450117, "loss": 0.109, "step": 23400 }, { "epoch": 0.59, "learning_rate": 0.0021177800668291335, "loss": 0.1042, "step": 23410 }, { "epoch": 0.59, "learning_rate": 0.002117403210813255, "loss": 0.109, "step": 23420 }, { "epoch": 0.59, "learning_rate": 0.002117026354797377, "loss": 0.1113, "step": 23430 }, { "epoch": 0.59, "learning_rate": 0.002116649498781499, "loss": 0.1092, "step": 23440 }, { "epoch": 0.59, "learning_rate": 0.0021162726427656204, "loss": 0.1081, "step": 23450 }, { "epoch": 0.59, "learning_rate": 0.0021158957867497426, "loss": 0.1092, "step": 23460 }, { "epoch": 0.59, "learning_rate": 0.0021155189307338644, "loss": 0.1102, "step": 23470 }, { "epoch": 0.59, "learning_rate": 0.002115142074717986, "loss": 0.1068, "step": 23480 }, { "epoch": 0.59, "learning_rate": 0.002114765218702108, "loss": 0.1131, "step": 23490 }, { "epoch": 0.59, "learning_rate": 0.0021143883626862296, "loss": 0.1073, "step": 23500 }, { "epoch": 0.59, "eval_cer": 0.6666681103576648, "eval_loss": 0.08526523411273956, "eval_runtime": 90.7857, "eval_samples_per_second": 110.138, "eval_steps_per_second": 6.884, "step": 23500 }, { "epoch": 0.59, "learning_rate": 0.0021140115066703518, "loss": 0.1107, "step": 23510 }, { "epoch": 0.59, "learning_rate": 0.0021136346506544735, "loss": 0.1094, "step": 23520 }, { "epoch": 0.59, "learning_rate": 0.002113257794638595, "loss": 0.1098, "step": 23530 }, { "epoch": 0.59, "learning_rate": 0.002112880938622717, "loss": 0.1093, "step": 23540 }, { "epoch": 0.59, "learning_rate": 0.0021125040826068388, "loss": 0.1112, "step": 23550 }, { "epoch": 0.59, "learning_rate": 0.0021121272265909605, "loss": 0.1123, "step": 23560 }, { "epoch": 0.59, "learning_rate": 0.0021117503705750823, "loss": 0.1089, "step": 23570 }, { "epoch": 0.59, "learning_rate": 0.002111373514559204, "loss": 0.1085, "step": 23580 }, { "epoch": 0.59, "learning_rate": 0.002110996658543326, "loss": 0.1095, "step": 23590 }, { "epoch": 0.59, "learning_rate": 0.0021106198025274475, "loss": 0.1061, "step": 23600 }, { "epoch": 0.59, "learning_rate": 0.0021102429465115697, "loss": 0.1114, "step": 23610 }, { "epoch": 0.59, "learning_rate": 0.0021098660904956914, "loss": 0.1127, "step": 23620 }, { "epoch": 0.59, "learning_rate": 0.002109489234479813, "loss": 0.1056, "step": 23630 }, { "epoch": 0.59, "learning_rate": 0.002109112378463935, "loss": 0.1092, "step": 23640 }, { "epoch": 0.59, "learning_rate": 0.0021087355224480566, "loss": 0.111, "step": 23650 }, { "epoch": 0.59, "learning_rate": 0.0021083586664321784, "loss": 0.1074, "step": 23660 }, { "epoch": 0.59, "learning_rate": 0.0021079818104163006, "loss": 0.1045, "step": 23670 }, { "epoch": 0.59, "learning_rate": 0.002107604954400422, "loss": 0.1101, "step": 23680 }, { "epoch": 0.6, "learning_rate": 0.002107228098384544, "loss": 0.1071, "step": 23690 }, { "epoch": 0.6, "learning_rate": 0.002106851242368666, "loss": 0.1107, "step": 23700 }, { "epoch": 0.6, "learning_rate": 0.0021064743863527875, "loss": 0.1095, "step": 23710 }, { "epoch": 0.6, "learning_rate": 0.0021060975303369093, "loss": 0.1113, "step": 23720 }, { "epoch": 0.6, "learning_rate": 0.002105720674321031, "loss": 0.108, "step": 23730 }, { "epoch": 0.6, "learning_rate": 0.0021053438183051528, "loss": 0.1056, "step": 23740 }, { "epoch": 0.6, "learning_rate": 0.002104966962289275, "loss": 0.1141, "step": 23750 }, { "epoch": 0.6, "learning_rate": 0.0021045901062733963, "loss": 0.1052, "step": 23760 }, { "epoch": 0.6, "learning_rate": 0.0021042132502575184, "loss": 0.1061, "step": 23770 }, { "epoch": 0.6, "learning_rate": 0.00210383639424164, "loss": 0.1064, "step": 23780 }, { "epoch": 0.6, "learning_rate": 0.002103459538225762, "loss": 0.1076, "step": 23790 }, { "epoch": 0.6, "learning_rate": 0.0021030826822098837, "loss": 0.1076, "step": 23800 }, { "epoch": 0.6, "learning_rate": 0.0021027058261940054, "loss": 0.1113, "step": 23810 }, { "epoch": 0.6, "learning_rate": 0.0021023289701781276, "loss": 0.1066, "step": 23820 }, { "epoch": 0.6, "learning_rate": 0.002101952114162249, "loss": 0.1064, "step": 23830 }, { "epoch": 0.6, "learning_rate": 0.0021015752581463707, "loss": 0.1085, "step": 23840 }, { "epoch": 0.6, "learning_rate": 0.002101198402130493, "loss": 0.1094, "step": 23850 }, { "epoch": 0.6, "learning_rate": 0.0021008215461146146, "loss": 0.1076, "step": 23860 }, { "epoch": 0.6, "learning_rate": 0.0021004446900987363, "loss": 0.1085, "step": 23870 }, { "epoch": 0.6, "learning_rate": 0.002100067834082858, "loss": 0.1075, "step": 23880 }, { "epoch": 0.6, "learning_rate": 0.00209969097806698, "loss": 0.1099, "step": 23890 }, { "epoch": 0.6, "learning_rate": 0.002099314122051102, "loss": 0.1092, "step": 23900 }, { "epoch": 0.6, "learning_rate": 0.0020989372660352233, "loss": 0.1071, "step": 23910 }, { "epoch": 0.6, "learning_rate": 0.0020985604100193455, "loss": 0.1099, "step": 23920 }, { "epoch": 0.6, "learning_rate": 0.0020981835540034672, "loss": 0.1094, "step": 23930 }, { "epoch": 0.6, "learning_rate": 0.002097806697987589, "loss": 0.1079, "step": 23940 }, { "epoch": 0.6, "learning_rate": 0.0020974298419717107, "loss": 0.1082, "step": 23950 }, { "epoch": 0.6, "learning_rate": 0.0020970529859558325, "loss": 0.1109, "step": 23960 }, { "epoch": 0.6, "learning_rate": 0.002096676129939954, "loss": 0.1072, "step": 23970 }, { "epoch": 0.6, "learning_rate": 0.0020962992739240764, "loss": 0.108, "step": 23980 }, { "epoch": 0.6, "learning_rate": 0.0020959224179081977, "loss": 0.1085, "step": 23990 }, { "epoch": 0.6, "learning_rate": 0.00209554556189232, "loss": 0.109, "step": 24000 }, { "epoch": 0.6, "eval_cer": 0.6662922694678122, "eval_loss": 0.08452539891004562, "eval_runtime": 90.7194, "eval_samples_per_second": 110.219, "eval_steps_per_second": 6.889, "step": 24000 }, { "epoch": 0.6, "learning_rate": 0.0020951687058764416, "loss": 0.1087, "step": 24010 }, { "epoch": 0.6, "learning_rate": 0.0020947918498605634, "loss": 0.111, "step": 24020 }, { "epoch": 0.6, "learning_rate": 0.002094414993844685, "loss": 0.1099, "step": 24030 }, { "epoch": 0.6, "learning_rate": 0.002094038137828807, "loss": 0.1096, "step": 24040 }, { "epoch": 0.6, "learning_rate": 0.0020936612818129286, "loss": 0.1041, "step": 24050 }, { "epoch": 0.6, "learning_rate": 0.0020932844257970503, "loss": 0.1044, "step": 24060 }, { "epoch": 0.6, "learning_rate": 0.002092907569781172, "loss": 0.1058, "step": 24070 }, { "epoch": 0.6, "learning_rate": 0.0020925307137652943, "loss": 0.106, "step": 24080 }, { "epoch": 0.61, "learning_rate": 0.002092153857749416, "loss": 0.1091, "step": 24090 }, { "epoch": 0.61, "learning_rate": 0.0020917770017335378, "loss": 0.1052, "step": 24100 }, { "epoch": 0.61, "learning_rate": 0.0020914001457176595, "loss": 0.1083, "step": 24110 }, { "epoch": 0.61, "learning_rate": 0.0020910232897017812, "loss": 0.1049, "step": 24120 }, { "epoch": 0.61, "learning_rate": 0.0020906464336859034, "loss": 0.1098, "step": 24130 }, { "epoch": 0.61, "learning_rate": 0.0020902695776700247, "loss": 0.1041, "step": 24140 }, { "epoch": 0.61, "learning_rate": 0.0020898927216541465, "loss": 0.1064, "step": 24150 }, { "epoch": 0.61, "learning_rate": 0.0020895158656382687, "loss": 0.1094, "step": 24160 }, { "epoch": 0.61, "learning_rate": 0.0020891390096223904, "loss": 0.1075, "step": 24170 }, { "epoch": 0.61, "learning_rate": 0.002088762153606512, "loss": 0.1095, "step": 24180 }, { "epoch": 0.61, "learning_rate": 0.002088385297590634, "loss": 0.1089, "step": 24190 }, { "epoch": 0.61, "learning_rate": 0.0020880084415747556, "loss": 0.1085, "step": 24200 }, { "epoch": 0.61, "learning_rate": 0.002087631585558878, "loss": 0.1145, "step": 24210 }, { "epoch": 0.61, "learning_rate": 0.002087254729542999, "loss": 0.1065, "step": 24220 }, { "epoch": 0.61, "learning_rate": 0.0020868778735271213, "loss": 0.1084, "step": 24230 }, { "epoch": 0.61, "learning_rate": 0.002086501017511243, "loss": 0.1005, "step": 24240 }, { "epoch": 0.61, "learning_rate": 0.002086124161495365, "loss": 0.108, "step": 24250 }, { "epoch": 0.61, "learning_rate": 0.0020857473054794865, "loss": 0.103, "step": 24260 }, { "epoch": 0.61, "learning_rate": 0.0020853704494636083, "loss": 0.1106, "step": 24270 }, { "epoch": 0.61, "learning_rate": 0.00208499359344773, "loss": 0.1071, "step": 24280 }, { "epoch": 0.61, "learning_rate": 0.0020846167374318518, "loss": 0.1054, "step": 24290 }, { "epoch": 0.61, "learning_rate": 0.0020842398814159735, "loss": 0.1085, "step": 24300 }, { "epoch": 0.61, "learning_rate": 0.0020838630254000957, "loss": 0.1067, "step": 24310 }, { "epoch": 0.61, "learning_rate": 0.0020834861693842174, "loss": 0.1058, "step": 24320 }, { "epoch": 0.61, "learning_rate": 0.002083109313368339, "loss": 0.1079, "step": 24330 }, { "epoch": 0.61, "learning_rate": 0.002082732457352461, "loss": 0.1084, "step": 24340 }, { "epoch": 0.61, "learning_rate": 0.0020823556013365827, "loss": 0.1096, "step": 24350 }, { "epoch": 0.61, "learning_rate": 0.002081978745320705, "loss": 0.1084, "step": 24360 }, { "epoch": 0.61, "learning_rate": 0.002081601889304826, "loss": 0.1093, "step": 24370 }, { "epoch": 0.61, "learning_rate": 0.002081225033288948, "loss": 0.106, "step": 24380 }, { "epoch": 0.61, "learning_rate": 0.00208084817727307, "loss": 0.1097, "step": 24390 }, { "epoch": 0.61, "learning_rate": 0.002080471321257192, "loss": 0.1105, "step": 24400 }, { "epoch": 0.61, "learning_rate": 0.0020800944652413136, "loss": 0.1031, "step": 24410 }, { "epoch": 0.61, "learning_rate": 0.0020797176092254353, "loss": 0.1092, "step": 24420 }, { "epoch": 0.61, "learning_rate": 0.002079340753209557, "loss": 0.1081, "step": 24430 }, { "epoch": 0.61, "learning_rate": 0.0020789638971936792, "loss": 0.1044, "step": 24440 }, { "epoch": 0.61, "learning_rate": 0.0020785870411778005, "loss": 0.1106, "step": 24450 }, { "epoch": 0.61, "learning_rate": 0.0020782101851619223, "loss": 0.1071, "step": 24460 }, { "epoch": 0.61, "learning_rate": 0.0020778333291460445, "loss": 0.1115, "step": 24470 }, { "epoch": 0.62, "learning_rate": 0.0020774564731301658, "loss": 0.1085, "step": 24480 }, { "epoch": 0.62, "learning_rate": 0.002077079617114288, "loss": 0.1038, "step": 24490 }, { "epoch": 0.62, "learning_rate": 0.0020767027610984097, "loss": 0.1073, "step": 24500 }, { "epoch": 0.62, "eval_cer": 0.6662446276648731, "eval_loss": 0.0842297375202179, "eval_runtime": 90.7825, "eval_samples_per_second": 110.142, "eval_steps_per_second": 6.885, "step": 24500 }, { "epoch": 0.62, "learning_rate": 0.0020763259050825314, "loss": 0.1039, "step": 24510 }, { "epoch": 0.62, "learning_rate": 0.002075949049066653, "loss": 0.1047, "step": 24520 }, { "epoch": 0.62, "learning_rate": 0.002075572193050775, "loss": 0.1053, "step": 24530 }, { "epoch": 0.62, "learning_rate": 0.002075195337034897, "loss": 0.1017, "step": 24540 }, { "epoch": 0.62, "learning_rate": 0.002074818481019019, "loss": 0.1053, "step": 24550 }, { "epoch": 0.62, "learning_rate": 0.00207444162500314, "loss": 0.1045, "step": 24560 }, { "epoch": 0.62, "learning_rate": 0.0020740647689872624, "loss": 0.1002, "step": 24570 }, { "epoch": 0.62, "learning_rate": 0.002073687912971384, "loss": 0.1062, "step": 24580 }, { "epoch": 0.62, "learning_rate": 0.002073311056955506, "loss": 0.1074, "step": 24590 }, { "epoch": 0.62, "learning_rate": 0.0020729342009396276, "loss": 0.1043, "step": 24600 }, { "epoch": 0.62, "learning_rate": 0.0020725573449237493, "loss": 0.1087, "step": 24610 }, { "epoch": 0.62, "learning_rate": 0.0020721804889078715, "loss": 0.1081, "step": 24620 }, { "epoch": 0.62, "learning_rate": 0.0020718036328919933, "loss": 0.1067, "step": 24630 }, { "epoch": 0.62, "learning_rate": 0.002071426776876115, "loss": 0.1084, "step": 24640 }, { "epoch": 0.62, "learning_rate": 0.0020710499208602367, "loss": 0.1083, "step": 24650 }, { "epoch": 0.62, "learning_rate": 0.0020706730648443585, "loss": 0.1072, "step": 24660 }, { "epoch": 0.62, "learning_rate": 0.0020702962088284807, "loss": 0.1063, "step": 24670 }, { "epoch": 0.62, "learning_rate": 0.002069919352812602, "loss": 0.1022, "step": 24680 }, { "epoch": 0.62, "learning_rate": 0.0020695424967967237, "loss": 0.1075, "step": 24690 }, { "epoch": 0.62, "learning_rate": 0.002069165640780846, "loss": 0.1082, "step": 24700 }, { "epoch": 0.62, "learning_rate": 0.002068788784764967, "loss": 0.1053, "step": 24710 }, { "epoch": 0.62, "learning_rate": 0.0020684119287490894, "loss": 0.1078, "step": 24720 }, { "epoch": 0.62, "learning_rate": 0.002068035072733211, "loss": 0.1086, "step": 24730 }, { "epoch": 0.62, "learning_rate": 0.002067658216717333, "loss": 0.1062, "step": 24740 }, { "epoch": 0.62, "learning_rate": 0.0020672813607014546, "loss": 0.1093, "step": 24750 }, { "epoch": 0.62, "learning_rate": 0.0020669045046855764, "loss": 0.1075, "step": 24760 }, { "epoch": 0.62, "learning_rate": 0.0020665276486696985, "loss": 0.104, "step": 24770 }, { "epoch": 0.62, "learning_rate": 0.0020661507926538203, "loss": 0.1061, "step": 24780 }, { "epoch": 0.62, "learning_rate": 0.0020657739366379416, "loss": 0.1052, "step": 24790 }, { "epoch": 0.62, "learning_rate": 0.0020653970806220638, "loss": 0.1068, "step": 24800 }, { "epoch": 0.62, "learning_rate": 0.0020650202246061855, "loss": 0.1067, "step": 24810 }, { "epoch": 0.62, "learning_rate": 0.0020646433685903073, "loss": 0.1059, "step": 24820 }, { "epoch": 0.62, "learning_rate": 0.002064266512574429, "loss": 0.1069, "step": 24830 }, { "epoch": 0.62, "learning_rate": 0.0020638896565585508, "loss": 0.1024, "step": 24840 }, { "epoch": 0.62, "learning_rate": 0.002063512800542673, "loss": 0.1061, "step": 24850 }, { "epoch": 0.62, "learning_rate": 0.0020631359445267947, "loss": 0.1087, "step": 24860 }, { "epoch": 0.62, "learning_rate": 0.002062759088510916, "loss": 0.1065, "step": 24870 }, { "epoch": 0.63, "learning_rate": 0.002062382232495038, "loss": 0.1048, "step": 24880 }, { "epoch": 0.63, "learning_rate": 0.00206200537647916, "loss": 0.1081, "step": 24890 }, { "epoch": 0.63, "learning_rate": 0.0020616285204632817, "loss": 0.1052, "step": 24900 }, { "epoch": 0.63, "learning_rate": 0.0020612516644474034, "loss": 0.1043, "step": 24910 }, { "epoch": 0.63, "learning_rate": 0.002060874808431525, "loss": 0.1082, "step": 24920 }, { "epoch": 0.63, "learning_rate": 0.0020604979524156473, "loss": 0.1031, "step": 24930 }, { "epoch": 0.63, "learning_rate": 0.0020601210963997686, "loss": 0.1079, "step": 24940 }, { "epoch": 0.63, "learning_rate": 0.002059744240383891, "loss": 0.1063, "step": 24950 }, { "epoch": 0.63, "learning_rate": 0.0020593673843680126, "loss": 0.1017, "step": 24960 }, { "epoch": 0.63, "learning_rate": 0.0020589905283521343, "loss": 0.1105, "step": 24970 }, { "epoch": 0.63, "learning_rate": 0.002058613672336256, "loss": 0.1095, "step": 24980 }, { "epoch": 0.63, "learning_rate": 0.002058236816320378, "loss": 0.1111, "step": 24990 }, { "epoch": 0.63, "learning_rate": 0.0020578599603044995, "loss": 0.1062, "step": 25000 }, { "epoch": 0.63, "eval_cer": 0.6662200849179045, "eval_loss": 0.0830809623003006, "eval_runtime": 90.7235, "eval_samples_per_second": 110.214, "eval_steps_per_second": 6.889, "step": 25000 }, { "epoch": 0.63, "learning_rate": 0.0020574831042886217, "loss": 0.1057, "step": 25010 }, { "epoch": 0.63, "learning_rate": 0.002057106248272743, "loss": 0.107, "step": 25020 }, { "epoch": 0.63, "learning_rate": 0.002056729392256865, "loss": 0.107, "step": 25030 }, { "epoch": 0.63, "learning_rate": 0.002056352536240987, "loss": 0.109, "step": 25040 }, { "epoch": 0.63, "learning_rate": 0.0020559756802251087, "loss": 0.1029, "step": 25050 }, { "epoch": 0.63, "learning_rate": 0.0020555988242092304, "loss": 0.1044, "step": 25060 }, { "epoch": 0.63, "learning_rate": 0.002055221968193352, "loss": 0.1039, "step": 25070 }, { "epoch": 0.63, "learning_rate": 0.0020548451121774744, "loss": 0.1063, "step": 25080 }, { "epoch": 0.63, "learning_rate": 0.002054468256161596, "loss": 0.1064, "step": 25090 }, { "epoch": 0.63, "learning_rate": 0.0020540914001457174, "loss": 0.1046, "step": 25100 }, { "epoch": 0.63, "learning_rate": 0.0020537145441298396, "loss": 0.1034, "step": 25110 }, { "epoch": 0.63, "learning_rate": 0.0020533376881139613, "loss": 0.1062, "step": 25120 }, { "epoch": 0.63, "learning_rate": 0.002052960832098083, "loss": 0.1068, "step": 25130 }, { "epoch": 0.63, "learning_rate": 0.002052583976082205, "loss": 0.1041, "step": 25140 }, { "epoch": 0.63, "learning_rate": 0.0020522071200663266, "loss": 0.1065, "step": 25150 }, { "epoch": 0.63, "learning_rate": 0.0020518302640504488, "loss": 0.1041, "step": 25160 }, { "epoch": 0.63, "learning_rate": 0.00205145340803457, "loss": 0.1073, "step": 25170 }, { "epoch": 0.63, "learning_rate": 0.0020510765520186922, "loss": 0.1049, "step": 25180 }, { "epoch": 0.63, "learning_rate": 0.002050699696002814, "loss": 0.1037, "step": 25190 }, { "epoch": 0.63, "learning_rate": 0.0020503228399869357, "loss": 0.1044, "step": 25200 }, { "epoch": 0.63, "learning_rate": 0.0020499459839710575, "loss": 0.1079, "step": 25210 }, { "epoch": 0.63, "learning_rate": 0.0020495691279551792, "loss": 0.103, "step": 25220 }, { "epoch": 0.63, "learning_rate": 0.002049192271939301, "loss": 0.1066, "step": 25230 }, { "epoch": 0.63, "learning_rate": 0.002048815415923423, "loss": 0.1085, "step": 25240 }, { "epoch": 0.63, "learning_rate": 0.0020484385599075445, "loss": 0.1048, "step": 25250 }, { "epoch": 0.63, "learning_rate": 0.0020480617038916666, "loss": 0.1102, "step": 25260 }, { "epoch": 0.63, "learning_rate": 0.0020476848478757884, "loss": 0.1088, "step": 25270 }, { "epoch": 0.64, "learning_rate": 0.00204730799185991, "loss": 0.1043, "step": 25280 }, { "epoch": 0.64, "learning_rate": 0.002046931135844032, "loss": 0.1093, "step": 25290 }, { "epoch": 0.64, "learning_rate": 0.0020465542798281536, "loss": 0.1037, "step": 25300 }, { "epoch": 0.64, "learning_rate": 0.0020461774238122754, "loss": 0.1057, "step": 25310 }, { "epoch": 0.64, "learning_rate": 0.0020458005677963975, "loss": 0.1083, "step": 25320 }, { "epoch": 0.64, "learning_rate": 0.002045423711780519, "loss": 0.1039, "step": 25330 }, { "epoch": 0.64, "learning_rate": 0.002045046855764641, "loss": 0.1075, "step": 25340 }, { "epoch": 0.64, "learning_rate": 0.0020446699997487628, "loss": 0.1023, "step": 25350 }, { "epoch": 0.64, "learning_rate": 0.0020442931437328845, "loss": 0.1043, "step": 25360 }, { "epoch": 0.64, "learning_rate": 0.0020439162877170063, "loss": 0.1027, "step": 25370 }, { "epoch": 0.64, "learning_rate": 0.002043539431701128, "loss": 0.106, "step": 25380 }, { "epoch": 0.64, "learning_rate": 0.00204316257568525, "loss": 0.1073, "step": 25390 }, { "epoch": 0.64, "learning_rate": 0.0020427857196693715, "loss": 0.1105, "step": 25400 }, { "epoch": 0.64, "learning_rate": 0.0020424088636534932, "loss": 0.1081, "step": 25410 }, { "epoch": 0.64, "learning_rate": 0.0020420320076376154, "loss": 0.104, "step": 25420 }, { "epoch": 0.64, "learning_rate": 0.002041655151621737, "loss": 0.104, "step": 25430 }, { "epoch": 0.64, "learning_rate": 0.002041278295605859, "loss": 0.1032, "step": 25440 }, { "epoch": 0.64, "learning_rate": 0.0020409014395899806, "loss": 0.1035, "step": 25450 }, { "epoch": 0.64, "learning_rate": 0.0020405245835741024, "loss": 0.1042, "step": 25460 }, { "epoch": 0.64, "learning_rate": 0.0020401477275582246, "loss": 0.1058, "step": 25470 }, { "epoch": 0.64, "learning_rate": 0.002039770871542346, "loss": 0.1043, "step": 25480 }, { "epoch": 0.64, "learning_rate": 0.002039394015526468, "loss": 0.1057, "step": 25490 }, { "epoch": 0.64, "learning_rate": 0.00203901715951059, "loss": 0.1018, "step": 25500 }, { "epoch": 0.64, "eval_cer": 0.6662013169349286, "eval_loss": 0.08301563560962677, "eval_runtime": 90.6697, "eval_samples_per_second": 110.279, "eval_steps_per_second": 6.893, "step": 25500 }, { "epoch": 0.64, "learning_rate": 0.0020386403034947116, "loss": 0.104, "step": 25510 }, { "epoch": 0.64, "learning_rate": 0.0020382634474788333, "loss": 0.1074, "step": 25520 }, { "epoch": 0.64, "learning_rate": 0.002037886591462955, "loss": 0.1081, "step": 25530 }, { "epoch": 0.64, "learning_rate": 0.002037509735447077, "loss": 0.104, "step": 25540 }, { "epoch": 0.64, "learning_rate": 0.002037132879431199, "loss": 0.1028, "step": 25550 }, { "epoch": 0.64, "learning_rate": 0.0020367560234153203, "loss": 0.1061, "step": 25560 }, { "epoch": 0.64, "learning_rate": 0.0020363791673994425, "loss": 0.1077, "step": 25570 }, { "epoch": 0.64, "learning_rate": 0.002036002311383564, "loss": 0.1092, "step": 25580 }, { "epoch": 0.64, "learning_rate": 0.002035625455367686, "loss": 0.1062, "step": 25590 }, { "epoch": 0.64, "learning_rate": 0.0020352485993518077, "loss": 0.1037, "step": 25600 }, { "epoch": 0.64, "learning_rate": 0.0020348717433359294, "loss": 0.1011, "step": 25610 }, { "epoch": 0.64, "learning_rate": 0.002034494887320051, "loss": 0.1059, "step": 25620 }, { "epoch": 0.64, "learning_rate": 0.002034118031304173, "loss": 0.1126, "step": 25630 }, { "epoch": 0.64, "learning_rate": 0.0020337411752882947, "loss": 0.105, "step": 25640 }, { "epoch": 0.64, "learning_rate": 0.002033364319272417, "loss": 0.1067, "step": 25650 }, { "epoch": 0.64, "learning_rate": 0.0020329874632565386, "loss": 0.1051, "step": 25660 }, { "epoch": 0.64, "learning_rate": 0.0020326106072406603, "loss": 0.102, "step": 25670 }, { "epoch": 0.65, "learning_rate": 0.002032233751224782, "loss": 0.1073, "step": 25680 }, { "epoch": 0.65, "learning_rate": 0.002031856895208904, "loss": 0.105, "step": 25690 }, { "epoch": 0.65, "learning_rate": 0.002031480039193026, "loss": 0.105, "step": 25700 }, { "epoch": 0.65, "learning_rate": 0.0020311031831771473, "loss": 0.106, "step": 25710 }, { "epoch": 0.65, "learning_rate": 0.002030726327161269, "loss": 0.1013, "step": 25720 }, { "epoch": 0.65, "learning_rate": 0.0020303494711453912, "loss": 0.1043, "step": 25730 }, { "epoch": 0.65, "learning_rate": 0.002029972615129513, "loss": 0.1061, "step": 25740 }, { "epoch": 0.65, "learning_rate": 0.0020295957591136347, "loss": 0.1047, "step": 25750 }, { "epoch": 0.65, "learning_rate": 0.0020292189030977565, "loss": 0.104, "step": 25760 }, { "epoch": 0.65, "learning_rate": 0.002028842047081878, "loss": 0.1056, "step": 25770 }, { "epoch": 0.65, "learning_rate": 0.0020284651910660004, "loss": 0.106, "step": 25780 }, { "epoch": 0.65, "learning_rate": 0.0020280883350501217, "loss": 0.105, "step": 25790 }, { "epoch": 0.65, "learning_rate": 0.002027711479034244, "loss": 0.1049, "step": 25800 }, { "epoch": 0.65, "learning_rate": 0.0020273346230183656, "loss": 0.1061, "step": 25810 }, { "epoch": 0.65, "learning_rate": 0.002026957767002487, "loss": 0.1009, "step": 25820 }, { "epoch": 0.65, "learning_rate": 0.002026580910986609, "loss": 0.1066, "step": 25830 }, { "epoch": 0.65, "learning_rate": 0.002026204054970731, "loss": 0.108, "step": 25840 }, { "epoch": 0.65, "learning_rate": 0.0020258271989548526, "loss": 0.102, "step": 25850 }, { "epoch": 0.65, "learning_rate": 0.0020254503429389743, "loss": 0.1052, "step": 25860 }, { "epoch": 0.65, "learning_rate": 0.002025073486923096, "loss": 0.1013, "step": 25870 }, { "epoch": 0.65, "learning_rate": 0.0020246966309072183, "loss": 0.1034, "step": 25880 }, { "epoch": 0.65, "learning_rate": 0.00202431977489134, "loss": 0.1061, "step": 25890 }, { "epoch": 0.65, "learning_rate": 0.0020239429188754618, "loss": 0.1032, "step": 25900 }, { "epoch": 0.65, "learning_rate": 0.0020235660628595835, "loss": 0.1068, "step": 25910 }, { "epoch": 0.65, "learning_rate": 0.0020231892068437052, "loss": 0.1042, "step": 25920 }, { "epoch": 0.65, "learning_rate": 0.0020228123508278274, "loss": 0.106, "step": 25930 }, { "epoch": 0.65, "learning_rate": 0.0020224354948119487, "loss": 0.1053, "step": 25940 }, { "epoch": 0.65, "learning_rate": 0.0020220586387960705, "loss": 0.1049, "step": 25950 }, { "epoch": 0.65, "learning_rate": 0.0020216817827801927, "loss": 0.1066, "step": 25960 }, { "epoch": 0.65, "learning_rate": 0.0020213049267643144, "loss": 0.1051, "step": 25970 }, { "epoch": 0.65, "learning_rate": 0.002020928070748436, "loss": 0.1068, "step": 25980 }, { "epoch": 0.65, "learning_rate": 0.002020551214732558, "loss": 0.1025, "step": 25990 }, { "epoch": 0.65, "learning_rate": 0.0020201743587166796, "loss": 0.1052, "step": 26000 }, { "epoch": 0.65, "eval_cer": 0.6666334617737092, "eval_loss": 0.08180632442235947, "eval_runtime": 90.778, "eval_samples_per_second": 110.148, "eval_steps_per_second": 6.885, "step": 26000 }, { "epoch": 0.65, "learning_rate": 0.002019797502700802, "loss": 0.108, "step": 26010 }, { "epoch": 0.65, "learning_rate": 0.002019420646684923, "loss": 0.1042, "step": 26020 }, { "epoch": 0.65, "learning_rate": 0.002019043790669045, "loss": 0.1014, "step": 26030 }, { "epoch": 0.65, "learning_rate": 0.002018666934653167, "loss": 0.1059, "step": 26040 }, { "epoch": 0.65, "learning_rate": 0.0020182900786372884, "loss": 0.1055, "step": 26050 }, { "epoch": 0.65, "learning_rate": 0.0020179132226214105, "loss": 0.1078, "step": 26060 }, { "epoch": 0.65, "learning_rate": 0.0020175363666055323, "loss": 0.1042, "step": 26070 }, { "epoch": 0.66, "learning_rate": 0.002017159510589654, "loss": 0.104, "step": 26080 }, { "epoch": 0.66, "learning_rate": 0.0020167826545737758, "loss": 0.1017, "step": 26090 }, { "epoch": 0.66, "learning_rate": 0.0020164057985578975, "loss": 0.1055, "step": 26100 }, { "epoch": 0.66, "learning_rate": 0.0020160289425420197, "loss": 0.0993, "step": 26110 }, { "epoch": 0.66, "learning_rate": 0.0020156520865261414, "loss": 0.1057, "step": 26120 }, { "epoch": 0.66, "learning_rate": 0.0020152752305102628, "loss": 0.1031, "step": 26130 }, { "epoch": 0.66, "learning_rate": 0.002014898374494385, "loss": 0.1055, "step": 26140 }, { "epoch": 0.66, "learning_rate": 0.0020145215184785067, "loss": 0.1061, "step": 26150 }, { "epoch": 0.66, "learning_rate": 0.0020141446624626284, "loss": 0.0989, "step": 26160 }, { "epoch": 0.66, "learning_rate": 0.00201376780644675, "loss": 0.1023, "step": 26170 }, { "epoch": 0.66, "learning_rate": 0.002013390950430872, "loss": 0.1088, "step": 26180 }, { "epoch": 0.66, "learning_rate": 0.002013014094414994, "loss": 0.1023, "step": 26190 }, { "epoch": 0.66, "learning_rate": 0.002012637238399116, "loss": 0.1028, "step": 26200 }, { "epoch": 0.66, "learning_rate": 0.0020122603823832376, "loss": 0.1036, "step": 26210 }, { "epoch": 0.66, "learning_rate": 0.0020118835263673593, "loss": 0.1035, "step": 26220 }, { "epoch": 0.66, "learning_rate": 0.002011506670351481, "loss": 0.1043, "step": 26230 }, { "epoch": 0.66, "learning_rate": 0.0020111298143356032, "loss": 0.1044, "step": 26240 }, { "epoch": 0.66, "learning_rate": 0.0020107529583197246, "loss": 0.1008, "step": 26250 }, { "epoch": 0.66, "learning_rate": 0.0020103761023038463, "loss": 0.1013, "step": 26260 }, { "epoch": 0.66, "learning_rate": 0.0020099992462879685, "loss": 0.1047, "step": 26270 }, { "epoch": 0.66, "learning_rate": 0.00200962239027209, "loss": 0.1028, "step": 26280 }, { "epoch": 0.66, "learning_rate": 0.002009245534256212, "loss": 0.1029, "step": 26290 }, { "epoch": 0.66, "learning_rate": 0.0020088686782403337, "loss": 0.1066, "step": 26300 }, { "epoch": 0.66, "learning_rate": 0.0020084918222244555, "loss": 0.1083, "step": 26310 }, { "epoch": 0.66, "learning_rate": 0.002008114966208577, "loss": 0.1057, "step": 26320 }, { "epoch": 0.66, "learning_rate": 0.002007738110192699, "loss": 0.1027, "step": 26330 }, { "epoch": 0.66, "learning_rate": 0.002007361254176821, "loss": 0.1038, "step": 26340 }, { "epoch": 0.66, "learning_rate": 0.002006984398160943, "loss": 0.101, "step": 26350 }, { "epoch": 0.66, "learning_rate": 0.002006607542145064, "loss": 0.1049, "step": 26360 }, { "epoch": 0.66, "learning_rate": 0.0020062306861291864, "loss": 0.1054, "step": 26370 }, { "epoch": 0.66, "learning_rate": 0.002005853830113308, "loss": 0.1023, "step": 26380 }, { "epoch": 0.66, "learning_rate": 0.00200547697409743, "loss": 0.109, "step": 26390 }, { "epoch": 0.66, "learning_rate": 0.0020051001180815516, "loss": 0.1058, "step": 26400 }, { "epoch": 0.66, "learning_rate": 0.0020047232620656733, "loss": 0.1033, "step": 26410 }, { "epoch": 0.66, "learning_rate": 0.0020043464060497955, "loss": 0.1067, "step": 26420 }, { "epoch": 0.66, "learning_rate": 0.0020039695500339173, "loss": 0.1058, "step": 26430 }, { "epoch": 0.66, "learning_rate": 0.0020035926940180386, "loss": 0.1033, "step": 26440 }, { "epoch": 0.66, "learning_rate": 0.0020032158380021607, "loss": 0.1034, "step": 26450 }, { "epoch": 0.66, "learning_rate": 0.0020028389819862825, "loss": 0.1055, "step": 26460 }, { "epoch": 0.67, "learning_rate": 0.0020024621259704042, "loss": 0.0989, "step": 26470 }, { "epoch": 0.67, "learning_rate": 0.002002085269954526, "loss": 0.1056, "step": 26480 }, { "epoch": 0.67, "learning_rate": 0.0020017084139386477, "loss": 0.0971, "step": 26490 }, { "epoch": 0.67, "learning_rate": 0.00200133155792277, "loss": 0.1072, "step": 26500 }, { "epoch": 0.67, "eval_cer": 0.6662273033728953, "eval_loss": 0.08107112348079681, "eval_runtime": 90.712, "eval_samples_per_second": 110.228, "eval_steps_per_second": 6.89, "step": 26500 }, { "epoch": 0.67, "learning_rate": 0.0020009547019068912, "loss": 0.1071, "step": 26510 }, { "epoch": 0.67, "learning_rate": 0.0020005778458910134, "loss": 0.1079, "step": 26520 }, { "epoch": 0.67, "learning_rate": 0.002000200989875135, "loss": 0.1031, "step": 26530 }, { "epoch": 0.67, "learning_rate": 0.001999824133859257, "loss": 0.1041, "step": 26540 }, { "epoch": 0.67, "learning_rate": 0.0019994472778433786, "loss": 0.1062, "step": 26550 }, { "epoch": 0.67, "learning_rate": 0.0019990704218275004, "loss": 0.104, "step": 26560 }, { "epoch": 0.67, "learning_rate": 0.001998693565811622, "loss": 0.1036, "step": 26570 }, { "epoch": 0.67, "learning_rate": 0.0019983167097957443, "loss": 0.105, "step": 26580 }, { "epoch": 0.67, "learning_rate": 0.0019979398537798656, "loss": 0.1017, "step": 26590 }, { "epoch": 0.67, "learning_rate": 0.001997562997763988, "loss": 0.0991, "step": 26600 }, { "epoch": 0.67, "learning_rate": 0.0019971861417481095, "loss": 0.1046, "step": 26610 }, { "epoch": 0.67, "learning_rate": 0.0019968092857322313, "loss": 0.1014, "step": 26620 }, { "epoch": 0.67, "learning_rate": 0.001996432429716353, "loss": 0.1016, "step": 26630 }, { "epoch": 0.67, "learning_rate": 0.0019960555737004748, "loss": 0.1029, "step": 26640 }, { "epoch": 0.67, "learning_rate": 0.001995678717684597, "loss": 0.103, "step": 26650 }, { "epoch": 0.67, "learning_rate": 0.0019953018616687187, "loss": 0.1085, "step": 26660 }, { "epoch": 0.67, "learning_rate": 0.00199492500565284, "loss": 0.1062, "step": 26670 }, { "epoch": 0.67, "learning_rate": 0.001994548149636962, "loss": 0.1033, "step": 26680 }, { "epoch": 0.67, "learning_rate": 0.001994171293621084, "loss": 0.1044, "step": 26690 }, { "epoch": 0.67, "learning_rate": 0.0019937944376052057, "loss": 0.1017, "step": 26700 }, { "epoch": 0.67, "learning_rate": 0.0019934175815893274, "loss": 0.1029, "step": 26710 }, { "epoch": 0.67, "learning_rate": 0.001993040725573449, "loss": 0.1026, "step": 26720 }, { "epoch": 0.67, "learning_rate": 0.0019926638695575713, "loss": 0.1004, "step": 26730 }, { "epoch": 0.67, "learning_rate": 0.0019922870135416926, "loss": 0.1052, "step": 26740 }, { "epoch": 0.67, "learning_rate": 0.001991910157525815, "loss": 0.1053, "step": 26750 }, { "epoch": 0.67, "learning_rate": 0.0019915333015099366, "loss": 0.1025, "step": 26760 }, { "epoch": 0.67, "learning_rate": 0.0019911564454940583, "loss": 0.1065, "step": 26770 }, { "epoch": 0.67, "learning_rate": 0.00199077958947818, "loss": 0.1026, "step": 26780 }, { "epoch": 0.67, "learning_rate": 0.001990402733462302, "loss": 0.1062, "step": 26790 }, { "epoch": 0.67, "learning_rate": 0.0019900258774464235, "loss": 0.1052, "step": 26800 }, { "epoch": 0.67, "learning_rate": 0.0019896490214305457, "loss": 0.1018, "step": 26810 }, { "epoch": 0.67, "learning_rate": 0.001989272165414667, "loss": 0.104, "step": 26820 }, { "epoch": 0.67, "learning_rate": 0.001988895309398789, "loss": 0.0998, "step": 26830 }, { "epoch": 0.67, "learning_rate": 0.001988518453382911, "loss": 0.1007, "step": 26840 }, { "epoch": 0.67, "learning_rate": 0.0019881415973670327, "loss": 0.1004, "step": 26850 }, { "epoch": 0.67, "learning_rate": 0.0019877647413511544, "loss": 0.1022, "step": 26860 }, { "epoch": 0.68, "learning_rate": 0.001987387885335276, "loss": 0.1041, "step": 26870 }, { "epoch": 0.68, "learning_rate": 0.001987011029319398, "loss": 0.1023, "step": 26880 }, { "epoch": 0.68, "learning_rate": 0.00198663417330352, "loss": 0.1026, "step": 26890 }, { "epoch": 0.68, "learning_rate": 0.0019862573172876414, "loss": 0.1058, "step": 26900 }, { "epoch": 0.68, "learning_rate": 0.0019858804612717636, "loss": 0.1013, "step": 26910 }, { "epoch": 0.68, "learning_rate": 0.0019855036052558853, "loss": 0.1025, "step": 26920 }, { "epoch": 0.68, "learning_rate": 0.001985126749240007, "loss": 0.1068, "step": 26930 }, { "epoch": 0.68, "learning_rate": 0.001984749893224129, "loss": 0.1007, "step": 26940 }, { "epoch": 0.68, "learning_rate": 0.0019843730372082506, "loss": 0.1057, "step": 26950 }, { "epoch": 0.68, "learning_rate": 0.0019839961811923728, "loss": 0.1009, "step": 26960 }, { "epoch": 0.68, "learning_rate": 0.001983619325176494, "loss": 0.1003, "step": 26970 }, { "epoch": 0.68, "learning_rate": 0.001983242469160616, "loss": 0.1051, "step": 26980 }, { "epoch": 0.68, "learning_rate": 0.001982865613144738, "loss": 0.1025, "step": 26990 }, { "epoch": 0.68, "learning_rate": 0.0019824887571288597, "loss": 0.1023, "step": 27000 }, { "epoch": 0.68, "eval_cer": 0.6660819718124145, "eval_loss": 0.08071926981210709, "eval_runtime": 90.7266, "eval_samples_per_second": 110.21, "eval_steps_per_second": 6.889, "step": 27000 }, { "epoch": 0.68, "learning_rate": 0.0019821119011129815, "loss": 0.0987, "step": 27010 }, { "epoch": 0.68, "learning_rate": 0.0019817350450971032, "loss": 0.1022, "step": 27020 }, { "epoch": 0.68, "learning_rate": 0.001981358189081225, "loss": 0.0997, "step": 27030 }, { "epoch": 0.68, "learning_rate": 0.001980981333065347, "loss": 0.1049, "step": 27040 }, { "epoch": 0.68, "learning_rate": 0.0019806044770494685, "loss": 0.1034, "step": 27050 }, { "epoch": 0.68, "learning_rate": 0.0019802276210335906, "loss": 0.1, "step": 27060 }, { "epoch": 0.68, "learning_rate": 0.0019798507650177124, "loss": 0.0994, "step": 27070 }, { "epoch": 0.68, "learning_rate": 0.001979473909001834, "loss": 0.1041, "step": 27080 }, { "epoch": 0.68, "learning_rate": 0.001979097052985956, "loss": 0.1018, "step": 27090 }, { "epoch": 0.68, "learning_rate": 0.0019787201969700776, "loss": 0.1014, "step": 27100 }, { "epoch": 0.68, "learning_rate": 0.0019783433409541994, "loss": 0.1062, "step": 27110 }, { "epoch": 0.68, "learning_rate": 0.0019779664849383215, "loss": 0.1003, "step": 27120 }, { "epoch": 0.68, "learning_rate": 0.001977589628922443, "loss": 0.1022, "step": 27130 }, { "epoch": 0.68, "learning_rate": 0.001977212772906565, "loss": 0.1028, "step": 27140 }, { "epoch": 0.68, "learning_rate": 0.0019768359168906868, "loss": 0.0999, "step": 27150 }, { "epoch": 0.68, "learning_rate": 0.0019764590608748085, "loss": 0.1009, "step": 27160 }, { "epoch": 0.68, "learning_rate": 0.0019760822048589303, "loss": 0.0997, "step": 27170 }, { "epoch": 0.68, "learning_rate": 0.001975705348843052, "loss": 0.1038, "step": 27180 }, { "epoch": 0.68, "learning_rate": 0.001975328492827174, "loss": 0.1025, "step": 27190 }, { "epoch": 0.68, "learning_rate": 0.0019749516368112955, "loss": 0.1024, "step": 27200 }, { "epoch": 0.68, "learning_rate": 0.0019745747807954172, "loss": 0.1022, "step": 27210 }, { "epoch": 0.68, "learning_rate": 0.0019741979247795394, "loss": 0.0983, "step": 27220 }, { "epoch": 0.68, "learning_rate": 0.001973821068763661, "loss": 0.1008, "step": 27230 }, { "epoch": 0.68, "learning_rate": 0.001973444212747783, "loss": 0.1035, "step": 27240 }, { "epoch": 0.68, "learning_rate": 0.0019730673567319047, "loss": 0.1023, "step": 27250 }, { "epoch": 0.68, "learning_rate": 0.0019726905007160264, "loss": 0.1032, "step": 27260 }, { "epoch": 0.69, "learning_rate": 0.0019723136447001486, "loss": 0.0987, "step": 27270 }, { "epoch": 0.69, "learning_rate": 0.00197193678868427, "loss": 0.101, "step": 27280 }, { "epoch": 0.69, "learning_rate": 0.0019715599326683916, "loss": 0.0983, "step": 27290 }, { "epoch": 0.69, "learning_rate": 0.001971183076652514, "loss": 0.0978, "step": 27300 }, { "epoch": 0.69, "learning_rate": 0.0019708062206366356, "loss": 0.1028, "step": 27310 }, { "epoch": 0.69, "learning_rate": 0.0019704293646207573, "loss": 0.1008, "step": 27320 }, { "epoch": 0.69, "learning_rate": 0.001970052508604879, "loss": 0.1033, "step": 27330 }, { "epoch": 0.69, "learning_rate": 0.001969675652589001, "loss": 0.1035, "step": 27340 }, { "epoch": 0.69, "learning_rate": 0.001969298796573123, "loss": 0.1016, "step": 27350 }, { "epoch": 0.69, "learning_rate": 0.0019689219405572443, "loss": 0.1005, "step": 27360 }, { "epoch": 0.69, "learning_rate": 0.0019685450845413665, "loss": 0.1041, "step": 27370 }, { "epoch": 0.69, "learning_rate": 0.001968168228525488, "loss": 0.1032, "step": 27380 }, { "epoch": 0.69, "learning_rate": 0.0019677913725096095, "loss": 0.0945, "step": 27390 }, { "epoch": 0.69, "learning_rate": 0.0019674145164937317, "loss": 0.1027, "step": 27400 }, { "epoch": 0.69, "learning_rate": 0.0019670376604778534, "loss": 0.1041, "step": 27410 }, { "epoch": 0.69, "learning_rate": 0.001966660804461975, "loss": 0.1044, "step": 27420 }, { "epoch": 0.69, "learning_rate": 0.001966283948446097, "loss": 0.1061, "step": 27430 }, { "epoch": 0.69, "learning_rate": 0.0019659070924302187, "loss": 0.1008, "step": 27440 }, { "epoch": 0.69, "learning_rate": 0.001965530236414341, "loss": 0.1006, "step": 27450 }, { "epoch": 0.69, "learning_rate": 0.0019651533803984626, "loss": 0.0987, "step": 27460 }, { "epoch": 0.69, "learning_rate": 0.0019647765243825843, "loss": 0.1013, "step": 27470 }, { "epoch": 0.69, "learning_rate": 0.001964399668366706, "loss": 0.0994, "step": 27480 }, { "epoch": 0.69, "learning_rate": 0.001964022812350828, "loss": 0.1045, "step": 27490 }, { "epoch": 0.69, "learning_rate": 0.00196364595633495, "loss": 0.1013, "step": 27500 }, { "epoch": 0.69, "eval_cer": 0.6664063210566663, "eval_loss": 0.08010150492191315, "eval_runtime": 90.5425, "eval_samples_per_second": 110.434, "eval_steps_per_second": 6.903, "step": 27500 }, { "epoch": 0.69, "learning_rate": 0.0019632691003190713, "loss": 0.1035, "step": 27510 }, { "epoch": 0.69, "learning_rate": 0.001962892244303193, "loss": 0.1013, "step": 27520 }, { "epoch": 0.69, "learning_rate": 0.0019625153882873152, "loss": 0.1041, "step": 27530 }, { "epoch": 0.69, "learning_rate": 0.001962138532271437, "loss": 0.1011, "step": 27540 }, { "epoch": 0.69, "learning_rate": 0.0019617616762555587, "loss": 0.1012, "step": 27550 }, { "epoch": 0.69, "learning_rate": 0.0019613848202396805, "loss": 0.1019, "step": 27560 }, { "epoch": 0.69, "learning_rate": 0.0019610079642238022, "loss": 0.0998, "step": 27570 }, { "epoch": 0.69, "learning_rate": 0.0019606311082079244, "loss": 0.0991, "step": 27580 }, { "epoch": 0.69, "learning_rate": 0.0019602542521920457, "loss": 0.1025, "step": 27590 }, { "epoch": 0.69, "learning_rate": 0.001959877396176168, "loss": 0.0997, "step": 27600 }, { "epoch": 0.69, "learning_rate": 0.0019595005401602896, "loss": 0.104, "step": 27610 }, { "epoch": 0.69, "learning_rate": 0.001959123684144411, "loss": 0.1013, "step": 27620 }, { "epoch": 0.69, "learning_rate": 0.001958746828128533, "loss": 0.1012, "step": 27630 }, { "epoch": 0.69, "learning_rate": 0.001958369972112655, "loss": 0.1017, "step": 27640 }, { "epoch": 0.69, "learning_rate": 0.0019579931160967766, "loss": 0.1034, "step": 27650 }, { "epoch": 0.69, "learning_rate": 0.0019576162600808984, "loss": 0.1005, "step": 27660 }, { "epoch": 0.7, "learning_rate": 0.00195723940406502, "loss": 0.1005, "step": 27670 }, { "epoch": 0.7, "learning_rate": 0.0019568625480491423, "loss": 0.1019, "step": 27680 }, { "epoch": 0.7, "learning_rate": 0.001956485692033264, "loss": 0.1018, "step": 27690 }, { "epoch": 0.7, "learning_rate": 0.0019561088360173853, "loss": 0.1023, "step": 27700 }, { "epoch": 0.7, "learning_rate": 0.0019557319800015075, "loss": 0.1031, "step": 27710 }, { "epoch": 0.7, "learning_rate": 0.0019553551239856293, "loss": 0.1028, "step": 27720 }, { "epoch": 0.7, "learning_rate": 0.001954978267969751, "loss": 0.0986, "step": 27730 }, { "epoch": 0.7, "learning_rate": 0.0019546014119538727, "loss": 0.1046, "step": 27740 }, { "epoch": 0.7, "learning_rate": 0.0019542245559379945, "loss": 0.101, "step": 27750 }, { "epoch": 0.7, "learning_rate": 0.0019538476999221167, "loss": 0.1045, "step": 27760 }, { "epoch": 0.7, "learning_rate": 0.0019534708439062384, "loss": 0.103, "step": 27770 }, { "epoch": 0.7, "learning_rate": 0.00195309398789036, "loss": 0.1023, "step": 27780 }, { "epoch": 0.7, "learning_rate": 0.001952717131874482, "loss": 0.1007, "step": 27790 }, { "epoch": 0.7, "learning_rate": 0.0019523402758586036, "loss": 0.1021, "step": 27800 }, { "epoch": 0.7, "learning_rate": 0.0019519634198427256, "loss": 0.1061, "step": 27810 }, { "epoch": 0.7, "learning_rate": 0.0019515865638268471, "loss": 0.1013, "step": 27820 }, { "epoch": 0.7, "learning_rate": 0.001951209707810969, "loss": 0.1039, "step": 27830 }, { "epoch": 0.7, "learning_rate": 0.001950832851795091, "loss": 0.1005, "step": 27840 }, { "epoch": 0.7, "learning_rate": 0.0019504559957792126, "loss": 0.1013, "step": 27850 }, { "epoch": 0.7, "learning_rate": 0.0019500791397633343, "loss": 0.1003, "step": 27860 }, { "epoch": 0.7, "learning_rate": 0.0019497022837474563, "loss": 0.099, "step": 27870 }, { "epoch": 0.7, "learning_rate": 0.0019493254277315783, "loss": 0.1027, "step": 27880 }, { "epoch": 0.7, "learning_rate": 0.0019489485717156998, "loss": 0.0979, "step": 27890 }, { "epoch": 0.7, "learning_rate": 0.0019485717156998215, "loss": 0.1025, "step": 27900 }, { "epoch": 0.7, "learning_rate": 0.0019481948596839435, "loss": 0.0973, "step": 27910 }, { "epoch": 0.7, "learning_rate": 0.0019478180036680654, "loss": 0.1003, "step": 27920 }, { "epoch": 0.7, "learning_rate": 0.001947441147652187, "loss": 0.1009, "step": 27930 }, { "epoch": 0.7, "learning_rate": 0.0019470642916363087, "loss": 0.0995, "step": 27940 }, { "epoch": 0.7, "learning_rate": 0.0019466874356204307, "loss": 0.0998, "step": 27950 }, { "epoch": 0.7, "learning_rate": 0.0019463105796045526, "loss": 0.0988, "step": 27960 }, { "epoch": 0.7, "learning_rate": 0.0019459337235886742, "loss": 0.1018, "step": 27970 }, { "epoch": 0.7, "learning_rate": 0.0019455568675727961, "loss": 0.1023, "step": 27980 }, { "epoch": 0.7, "learning_rate": 0.0019451800115569179, "loss": 0.099, "step": 27990 }, { "epoch": 0.7, "learning_rate": 0.0019448031555410398, "loss": 0.0986, "step": 28000 }, { "epoch": 0.7, "eval_cer": 0.6663938090680156, "eval_loss": 0.07968434691429138, "eval_runtime": 90.6337, "eval_samples_per_second": 110.323, "eval_steps_per_second": 6.896, "step": 28000 }, { "epoch": 0.7, "learning_rate": 0.0019444262995251614, "loss": 0.1032, "step": 28010 }, { "epoch": 0.7, "learning_rate": 0.0019440494435092833, "loss": 0.0981, "step": 28020 }, { "epoch": 0.7, "learning_rate": 0.001943672587493405, "loss": 0.1021, "step": 28030 }, { "epoch": 0.7, "learning_rate": 0.0019432957314775266, "loss": 0.0998, "step": 28040 }, { "epoch": 0.7, "learning_rate": 0.0019429188754616486, "loss": 0.1031, "step": 28050 }, { "epoch": 0.7, "learning_rate": 0.0019425420194457705, "loss": 0.1053, "step": 28060 }, { "epoch": 0.71, "learning_rate": 0.0019421651634298923, "loss": 0.1035, "step": 28070 }, { "epoch": 0.71, "learning_rate": 0.001941788307414014, "loss": 0.101, "step": 28080 }, { "epoch": 0.71, "learning_rate": 0.0019414114513981358, "loss": 0.1014, "step": 28090 }, { "epoch": 0.71, "learning_rate": 0.0019410345953822577, "loss": 0.0977, "step": 28100 }, { "epoch": 0.71, "learning_rate": 0.0019406577393663795, "loss": 0.0996, "step": 28110 }, { "epoch": 0.71, "learning_rate": 0.0019402808833505012, "loss": 0.0977, "step": 28120 }, { "epoch": 0.71, "learning_rate": 0.001939904027334623, "loss": 0.1009, "step": 28130 }, { "epoch": 0.71, "learning_rate": 0.001939527171318745, "loss": 0.1008, "step": 28140 }, { "epoch": 0.71, "learning_rate": 0.0019391503153028669, "loss": 0.1033, "step": 28150 }, { "epoch": 0.71, "learning_rate": 0.0019387734592869884, "loss": 0.1008, "step": 28160 }, { "epoch": 0.71, "learning_rate": 0.0019383966032711101, "loss": 0.1006, "step": 28170 }, { "epoch": 0.71, "learning_rate": 0.0019380197472552321, "loss": 0.1, "step": 28180 }, { "epoch": 0.71, "learning_rate": 0.001937642891239354, "loss": 0.1031, "step": 28190 }, { "epoch": 0.71, "learning_rate": 0.0019372660352234756, "loss": 0.1011, "step": 28200 }, { "epoch": 0.71, "learning_rate": 0.0019368891792075973, "loss": 0.1005, "step": 28210 }, { "epoch": 0.71, "learning_rate": 0.0019365123231917193, "loss": 0.0974, "step": 28220 }, { "epoch": 0.71, "learning_rate": 0.0019361354671758413, "loss": 0.1, "step": 28230 }, { "epoch": 0.71, "learning_rate": 0.0019357586111599628, "loss": 0.0995, "step": 28240 }, { "epoch": 0.71, "learning_rate": 0.0019353817551440848, "loss": 0.0999, "step": 28250 }, { "epoch": 0.71, "learning_rate": 0.0019350048991282065, "loss": 0.0997, "step": 28260 }, { "epoch": 0.71, "learning_rate": 0.001934628043112328, "loss": 0.0988, "step": 28270 }, { "epoch": 0.71, "learning_rate": 0.00193425118709645, "loss": 0.1054, "step": 28280 }, { "epoch": 0.71, "learning_rate": 0.001933874331080572, "loss": 0.0984, "step": 28290 }, { "epoch": 0.71, "learning_rate": 0.0019334974750646937, "loss": 0.0963, "step": 28300 }, { "epoch": 0.71, "learning_rate": 0.0019331206190488152, "loss": 0.0975, "step": 28310 }, { "epoch": 0.71, "learning_rate": 0.0019327437630329372, "loss": 0.0986, "step": 28320 }, { "epoch": 0.71, "learning_rate": 0.0019323669070170591, "loss": 0.103, "step": 28330 }, { "epoch": 0.71, "learning_rate": 0.001931990051001181, "loss": 0.0999, "step": 28340 }, { "epoch": 0.71, "learning_rate": 0.0019316131949853024, "loss": 0.1017, "step": 28350 }, { "epoch": 0.71, "learning_rate": 0.0019312363389694244, "loss": 0.1024, "step": 28360 }, { "epoch": 0.71, "learning_rate": 0.0019308594829535463, "loss": 0.0984, "step": 28370 }, { "epoch": 0.71, "learning_rate": 0.001930482626937668, "loss": 0.0992, "step": 28380 }, { "epoch": 0.71, "learning_rate": 0.0019301057709217898, "loss": 0.1043, "step": 28390 }, { "epoch": 0.71, "learning_rate": 0.0019297289149059116, "loss": 0.1006, "step": 28400 }, { "epoch": 0.71, "learning_rate": 0.0019293520588900335, "loss": 0.1026, "step": 28410 }, { "epoch": 0.71, "learning_rate": 0.0019289752028741555, "loss": 0.1009, "step": 28420 }, { "epoch": 0.71, "learning_rate": 0.001928598346858277, "loss": 0.1028, "step": 28430 }, { "epoch": 0.71, "learning_rate": 0.0019282214908423988, "loss": 0.1039, "step": 28440 }, { "epoch": 0.71, "learning_rate": 0.0019278446348265207, "loss": 0.0983, "step": 28450 }, { "epoch": 0.72, "learning_rate": 0.0019274677788106427, "loss": 0.0987, "step": 28460 }, { "epoch": 0.72, "learning_rate": 0.0019270909227947642, "loss": 0.0997, "step": 28470 }, { "epoch": 0.72, "learning_rate": 0.001926714066778886, "loss": 0.1033, "step": 28480 }, { "epoch": 0.72, "learning_rate": 0.001926337210763008, "loss": 0.1025, "step": 28490 }, { "epoch": 0.72, "learning_rate": 0.0019259603547471295, "loss": 0.1022, "step": 28500 }, { "epoch": 0.72, "eval_cer": 0.6661753304969618, "eval_loss": 0.07863720506429672, "eval_runtime": 90.541, "eval_samples_per_second": 110.436, "eval_steps_per_second": 6.903, "step": 28500 }, { "epoch": 0.72, "learning_rate": 0.0019255834987312514, "loss": 0.1002, "step": 28510 }, { "epoch": 0.72, "learning_rate": 0.0019252066427153732, "loss": 0.0997, "step": 28520 }, { "epoch": 0.72, "learning_rate": 0.0019248297866994951, "loss": 0.1005, "step": 28530 }, { "epoch": 0.72, "learning_rate": 0.0019244529306836167, "loss": 0.099, "step": 28540 }, { "epoch": 0.72, "learning_rate": 0.0019240760746677386, "loss": 0.1016, "step": 28550 }, { "epoch": 0.72, "learning_rate": 0.0019236992186518606, "loss": 0.1033, "step": 28560 }, { "epoch": 0.72, "learning_rate": 0.0019233223626359823, "loss": 0.099, "step": 28570 }, { "epoch": 0.72, "learning_rate": 0.0019229455066201038, "loss": 0.0997, "step": 28580 }, { "epoch": 0.72, "learning_rate": 0.0019225686506042258, "loss": 0.0981, "step": 28590 }, { "epoch": 0.72, "learning_rate": 0.0019221917945883478, "loss": 0.0975, "step": 28600 }, { "epoch": 0.72, "learning_rate": 0.0019218149385724695, "loss": 0.1016, "step": 28610 }, { "epoch": 0.72, "learning_rate": 0.001921438082556591, "loss": 0.0965, "step": 28620 }, { "epoch": 0.72, "learning_rate": 0.001921061226540713, "loss": 0.1033, "step": 28630 }, { "epoch": 0.72, "learning_rate": 0.001920684370524835, "loss": 0.1017, "step": 28640 }, { "epoch": 0.72, "learning_rate": 0.0019203075145089567, "loss": 0.1016, "step": 28650 }, { "epoch": 0.72, "learning_rate": 0.0019199306584930785, "loss": 0.1009, "step": 28660 }, { "epoch": 0.72, "learning_rate": 0.0019195538024772002, "loss": 0.1024, "step": 28670 }, { "epoch": 0.72, "learning_rate": 0.0019191769464613222, "loss": 0.0999, "step": 28680 }, { "epoch": 0.72, "learning_rate": 0.001918800090445444, "loss": 0.1023, "step": 28690 }, { "epoch": 0.72, "learning_rate": 0.0019184232344295657, "loss": 0.1016, "step": 28700 }, { "epoch": 0.72, "learning_rate": 0.0019180463784136874, "loss": 0.1027, "step": 28710 }, { "epoch": 0.72, "learning_rate": 0.0019176695223978094, "loss": 0.1039, "step": 28720 }, { "epoch": 0.72, "learning_rate": 0.0019172926663819309, "loss": 0.0976, "step": 28730 }, { "epoch": 0.72, "learning_rate": 0.0019169158103660528, "loss": 0.0989, "step": 28740 }, { "epoch": 0.72, "learning_rate": 0.0019165389543501746, "loss": 0.0977, "step": 28750 }, { "epoch": 0.72, "learning_rate": 0.0019161620983342966, "loss": 0.0974, "step": 28760 }, { "epoch": 0.72, "learning_rate": 0.001915785242318418, "loss": 0.1004, "step": 28770 }, { "epoch": 0.72, "learning_rate": 0.00191540838630254, "loss": 0.0977, "step": 28780 }, { "epoch": 0.72, "learning_rate": 0.0019150315302866618, "loss": 0.1007, "step": 28790 }, { "epoch": 0.72, "learning_rate": 0.0019146546742707837, "loss": 0.0981, "step": 28800 }, { "epoch": 0.72, "learning_rate": 0.0019142778182549053, "loss": 0.1005, "step": 28810 }, { "epoch": 0.72, "learning_rate": 0.0019139009622390272, "loss": 0.099, "step": 28820 }, { "epoch": 0.72, "learning_rate": 0.0019135241062231492, "loss": 0.0974, "step": 28830 }, { "epoch": 0.72, "learning_rate": 0.001913147250207271, "loss": 0.097, "step": 28840 }, { "epoch": 0.72, "learning_rate": 0.0019127703941913925, "loss": 0.0989, "step": 28850 }, { "epoch": 0.73, "learning_rate": 0.0019123935381755144, "loss": 0.0987, "step": 28860 }, { "epoch": 0.73, "learning_rate": 0.0019120166821596364, "loss": 0.0988, "step": 28870 }, { "epoch": 0.73, "learning_rate": 0.0019116398261437581, "loss": 0.0983, "step": 28880 }, { "epoch": 0.73, "learning_rate": 0.0019112629701278797, "loss": 0.1038, "step": 28890 }, { "epoch": 0.73, "learning_rate": 0.0019108861141120016, "loss": 0.0969, "step": 28900 }, { "epoch": 0.73, "learning_rate": 0.0019105092580961236, "loss": 0.1002, "step": 28910 }, { "epoch": 0.73, "learning_rate": 0.0019101324020802453, "loss": 0.0995, "step": 28920 }, { "epoch": 0.73, "learning_rate": 0.0019097555460643669, "loss": 0.0996, "step": 28930 }, { "epoch": 0.73, "learning_rate": 0.0019093786900484888, "loss": 0.0971, "step": 28940 }, { "epoch": 0.73, "learning_rate": 0.0019090018340326108, "loss": 0.101, "step": 28950 }, { "epoch": 0.73, "learning_rate": 0.0019086249780167323, "loss": 0.0991, "step": 28960 }, { "epoch": 0.73, "learning_rate": 0.0019082481220008543, "loss": 0.1009, "step": 28970 }, { "epoch": 0.73, "learning_rate": 0.001907871265984976, "loss": 0.0994, "step": 28980 }, { "epoch": 0.73, "learning_rate": 0.001907494409969098, "loss": 0.0986, "step": 28990 }, { "epoch": 0.73, "learning_rate": 0.0019071175539532195, "loss": 0.0984, "step": 29000 }, { "epoch": 0.73, "eval_cer": 0.6658707116963514, "eval_loss": 0.07814398407936096, "eval_runtime": 90.6335, "eval_samples_per_second": 110.323, "eval_steps_per_second": 6.896, "step": 29000 }, { "epoch": 0.73, "learning_rate": 0.0019067406979373415, "loss": 0.1015, "step": 29010 }, { "epoch": 0.73, "learning_rate": 0.0019063638419214632, "loss": 0.1036, "step": 29020 }, { "epoch": 0.73, "learning_rate": 0.0019059869859055852, "loss": 0.096, "step": 29030 }, { "epoch": 0.73, "learning_rate": 0.0019056101298897067, "loss": 0.0991, "step": 29040 }, { "epoch": 0.73, "learning_rate": 0.0019052332738738287, "loss": 0.0942, "step": 29050 }, { "epoch": 0.73, "learning_rate": 0.0019048564178579504, "loss": 0.1032, "step": 29060 }, { "epoch": 0.73, "learning_rate": 0.0019044795618420724, "loss": 0.099, "step": 29070 }, { "epoch": 0.73, "learning_rate": 0.001904102705826194, "loss": 0.1025, "step": 29080 }, { "epoch": 0.73, "learning_rate": 0.0019037258498103159, "loss": 0.0979, "step": 29090 }, { "epoch": 0.73, "learning_rate": 0.0019033489937944376, "loss": 0.097, "step": 29100 }, { "epoch": 0.73, "learning_rate": 0.0019029721377785596, "loss": 0.0972, "step": 29110 }, { "epoch": 0.73, "learning_rate": 0.001902595281762681, "loss": 0.0996, "step": 29120 }, { "epoch": 0.73, "learning_rate": 0.001902218425746803, "loss": 0.0989, "step": 29130 }, { "epoch": 0.73, "learning_rate": 0.001901841569730925, "loss": 0.1029, "step": 29140 }, { "epoch": 0.73, "learning_rate": 0.0019014647137150465, "loss": 0.0997, "step": 29150 }, { "epoch": 0.73, "learning_rate": 0.0019010878576991683, "loss": 0.0979, "step": 29160 }, { "epoch": 0.73, "learning_rate": 0.0019007110016832902, "loss": 0.0987, "step": 29170 }, { "epoch": 0.73, "learning_rate": 0.0019003341456674122, "loss": 0.1012, "step": 29180 }, { "epoch": 0.73, "learning_rate": 0.0018999572896515337, "loss": 0.0981, "step": 29190 }, { "epoch": 0.73, "learning_rate": 0.0018995804336356555, "loss": 0.1002, "step": 29200 }, { "epoch": 0.73, "learning_rate": 0.0018992035776197774, "loss": 0.0982, "step": 29210 }, { "epoch": 0.73, "learning_rate": 0.0018988267216038994, "loss": 0.0995, "step": 29220 }, { "epoch": 0.73, "learning_rate": 0.001898449865588021, "loss": 0.0998, "step": 29230 }, { "epoch": 0.73, "learning_rate": 0.001898073009572143, "loss": 0.0971, "step": 29240 }, { "epoch": 0.73, "learning_rate": 0.0018976961535562646, "loss": 0.1025, "step": 29250 }, { "epoch": 0.74, "learning_rate": 0.0018973192975403866, "loss": 0.0967, "step": 29260 }, { "epoch": 0.74, "learning_rate": 0.0018969424415245081, "loss": 0.0998, "step": 29270 }, { "epoch": 0.74, "learning_rate": 0.00189656558550863, "loss": 0.0982, "step": 29280 }, { "epoch": 0.74, "learning_rate": 0.0018961887294927518, "loss": 0.1012, "step": 29290 }, { "epoch": 0.74, "learning_rate": 0.0018958118734768738, "loss": 0.0985, "step": 29300 }, { "epoch": 0.74, "learning_rate": 0.0018954350174609953, "loss": 0.0973, "step": 29310 }, { "epoch": 0.74, "learning_rate": 0.0018950581614451173, "loss": 0.096, "step": 29320 }, { "epoch": 0.74, "learning_rate": 0.001894681305429239, "loss": 0.0981, "step": 29330 }, { "epoch": 0.74, "learning_rate": 0.001894304449413361, "loss": 0.1002, "step": 29340 }, { "epoch": 0.74, "learning_rate": 0.0018939275933974825, "loss": 0.0987, "step": 29350 }, { "epoch": 0.74, "learning_rate": 0.0018935507373816045, "loss": 0.0973, "step": 29360 }, { "epoch": 0.74, "learning_rate": 0.0018931738813657262, "loss": 0.1002, "step": 29370 }, { "epoch": 0.74, "learning_rate": 0.001892797025349848, "loss": 0.0955, "step": 29380 }, { "epoch": 0.74, "learning_rate": 0.0018924201693339697, "loss": 0.0967, "step": 29390 }, { "epoch": 0.74, "learning_rate": 0.0018920433133180917, "loss": 0.1002, "step": 29400 }, { "epoch": 0.74, "learning_rate": 0.0018916664573022136, "loss": 0.0958, "step": 29410 }, { "epoch": 0.74, "learning_rate": 0.0018912896012863352, "loss": 0.0999, "step": 29420 }, { "epoch": 0.74, "learning_rate": 0.001890912745270457, "loss": 0.0973, "step": 29430 }, { "epoch": 0.74, "learning_rate": 0.0018905358892545789, "loss": 0.0988, "step": 29440 }, { "epoch": 0.74, "learning_rate": 0.0018901590332387008, "loss": 0.0957, "step": 29450 }, { "epoch": 0.74, "learning_rate": 0.0018897821772228224, "loss": 0.0978, "step": 29460 }, { "epoch": 0.74, "learning_rate": 0.001889405321206944, "loss": 0.1017, "step": 29470 }, { "epoch": 0.74, "learning_rate": 0.001889028465191066, "loss": 0.0977, "step": 29480 }, { "epoch": 0.74, "learning_rate": 0.001888651609175188, "loss": 0.0997, "step": 29490 }, { "epoch": 0.74, "learning_rate": 0.0018882747531593096, "loss": 0.0971, "step": 29500 }, { "epoch": 0.74, "eval_cer": 0.6662253784515644, "eval_loss": 0.077802374958992, "eval_runtime": 90.7555, "eval_samples_per_second": 110.175, "eval_steps_per_second": 6.887, "step": 29500 }, { "epoch": 0.74, "learning_rate": 0.0018878978971434313, "loss": 0.0972, "step": 29510 }, { "epoch": 0.74, "learning_rate": 0.0018875210411275533, "loss": 0.0957, "step": 29520 }, { "epoch": 0.74, "learning_rate": 0.0018871441851116752, "loss": 0.097, "step": 29530 }, { "epoch": 0.74, "learning_rate": 0.0018867673290957968, "loss": 0.0929, "step": 29540 }, { "epoch": 0.74, "learning_rate": 0.0018863904730799187, "loss": 0.0968, "step": 29550 }, { "epoch": 0.74, "learning_rate": 0.0018860136170640405, "loss": 0.0981, "step": 29560 }, { "epoch": 0.74, "learning_rate": 0.0018856367610481624, "loss": 0.0977, "step": 29570 }, { "epoch": 0.74, "learning_rate": 0.001885259905032284, "loss": 0.0952, "step": 29580 }, { "epoch": 0.74, "learning_rate": 0.001884883049016406, "loss": 0.097, "step": 29590 }, { "epoch": 0.74, "learning_rate": 0.0018845061930005277, "loss": 0.0973, "step": 29600 }, { "epoch": 0.74, "learning_rate": 0.0018841293369846492, "loss": 0.1026, "step": 29610 }, { "epoch": 0.74, "learning_rate": 0.0018837524809687711, "loss": 0.0981, "step": 29620 }, { "epoch": 0.74, "learning_rate": 0.001883375624952893, "loss": 0.0977, "step": 29630 }, { "epoch": 0.74, "learning_rate": 0.0018829987689370148, "loss": 0.0956, "step": 29640 }, { "epoch": 0.74, "learning_rate": 0.0018826219129211366, "loss": 0.0967, "step": 29650 }, { "epoch": 0.75, "learning_rate": 0.0018822450569052583, "loss": 0.0986, "step": 29660 }, { "epoch": 0.75, "learning_rate": 0.0018818682008893803, "loss": 0.0916, "step": 29670 }, { "epoch": 0.75, "learning_rate": 0.0018814913448735023, "loss": 0.1046, "step": 29680 }, { "epoch": 0.75, "learning_rate": 0.0018811144888576238, "loss": 0.0966, "step": 29690 }, { "epoch": 0.75, "learning_rate": 0.0018807376328417455, "loss": 0.0959, "step": 29700 }, { "epoch": 0.75, "learning_rate": 0.0018803607768258675, "loss": 0.099, "step": 29710 }, { "epoch": 0.75, "learning_rate": 0.0018799839208099895, "loss": 0.0978, "step": 29720 }, { "epoch": 0.75, "learning_rate": 0.001879607064794111, "loss": 0.0946, "step": 29730 }, { "epoch": 0.75, "learning_rate": 0.0018792302087782327, "loss": 0.0966, "step": 29740 }, { "epoch": 0.75, "learning_rate": 0.0018788533527623547, "loss": 0.0984, "step": 29750 }, { "epoch": 0.75, "learning_rate": 0.0018784764967464767, "loss": 0.1024, "step": 29760 }, { "epoch": 0.75, "learning_rate": 0.0018780996407305982, "loss": 0.0986, "step": 29770 }, { "epoch": 0.75, "learning_rate": 0.00187772278471472, "loss": 0.0995, "step": 29780 }, { "epoch": 0.75, "learning_rate": 0.0018773459286988419, "loss": 0.0969, "step": 29790 }, { "epoch": 0.75, "learning_rate": 0.0018769690726829638, "loss": 0.1, "step": 29800 }, { "epoch": 0.75, "learning_rate": 0.0018765922166670854, "loss": 0.1014, "step": 29810 }, { "epoch": 0.75, "learning_rate": 0.0018762153606512073, "loss": 0.0982, "step": 29820 }, { "epoch": 0.75, "learning_rate": 0.001875838504635329, "loss": 0.0963, "step": 29830 }, { "epoch": 0.75, "learning_rate": 0.0018754616486194506, "loss": 0.0949, "step": 29840 }, { "epoch": 0.75, "learning_rate": 0.0018750847926035726, "loss": 0.1005, "step": 29850 }, { "epoch": 0.75, "learning_rate": 0.0018747079365876945, "loss": 0.0978, "step": 29860 }, { "epoch": 0.75, "learning_rate": 0.0018743310805718163, "loss": 0.0981, "step": 29870 }, { "epoch": 0.75, "learning_rate": 0.0018739542245559378, "loss": 0.0951, "step": 29880 }, { "epoch": 0.75, "learning_rate": 0.0018735773685400598, "loss": 0.0977, "step": 29890 }, { "epoch": 0.75, "learning_rate": 0.0018732005125241817, "loss": 0.0988, "step": 29900 }, { "epoch": 0.75, "learning_rate": 0.0018728236565083035, "loss": 0.1009, "step": 29910 }, { "epoch": 0.75, "learning_rate": 0.001872446800492425, "loss": 0.0997, "step": 29920 }, { "epoch": 0.75, "learning_rate": 0.001872069944476547, "loss": 0.0971, "step": 29930 }, { "epoch": 0.75, "learning_rate": 0.001871693088460669, "loss": 0.1, "step": 29940 }, { "epoch": 0.75, "learning_rate": 0.0018713162324447907, "loss": 0.0997, "step": 29950 }, { "epoch": 0.75, "learning_rate": 0.0018709393764289124, "loss": 0.1002, "step": 29960 }, { "epoch": 0.75, "learning_rate": 0.0018705625204130342, "loss": 0.0974, "step": 29970 }, { "epoch": 0.75, "learning_rate": 0.0018701856643971561, "loss": 0.0967, "step": 29980 }, { "epoch": 0.75, "learning_rate": 0.001869808808381278, "loss": 0.0904, "step": 29990 }, { "epoch": 0.75, "learning_rate": 0.0018694319523653996, "loss": 0.0963, "step": 30000 }, { "epoch": 0.75, "eval_cer": 0.6659708076055567, "eval_loss": 0.07728173583745956, "eval_runtime": 90.6693, "eval_samples_per_second": 110.28, "eval_steps_per_second": 6.893, "step": 30000 }, { "epoch": 0.75, "learning_rate": 0.0018690550963495214, "loss": 0.1015, "step": 30010 }, { "epoch": 0.75, "learning_rate": 0.0018686782403336433, "loss": 0.0994, "step": 30020 }, { "epoch": 0.75, "learning_rate": 0.0018683013843177653, "loss": 0.1013, "step": 30030 }, { "epoch": 0.75, "learning_rate": 0.0018679245283018868, "loss": 0.0995, "step": 30040 }, { "epoch": 0.75, "learning_rate": 0.0018675476722860085, "loss": 0.0963, "step": 30050 }, { "epoch": 0.76, "learning_rate": 0.0018671708162701305, "loss": 0.0978, "step": 30060 }, { "epoch": 0.76, "learning_rate": 0.001866793960254252, "loss": 0.0989, "step": 30070 }, { "epoch": 0.76, "learning_rate": 0.001866417104238374, "loss": 0.0997, "step": 30080 }, { "epoch": 0.76, "learning_rate": 0.0018660402482224957, "loss": 0.0986, "step": 30090 }, { "epoch": 0.76, "learning_rate": 0.0018656633922066177, "loss": 0.0961, "step": 30100 }, { "epoch": 0.76, "learning_rate": 0.0018652865361907392, "loss": 0.0952, "step": 30110 }, { "epoch": 0.76, "learning_rate": 0.0018649096801748612, "loss": 0.0959, "step": 30120 }, { "epoch": 0.76, "learning_rate": 0.0018645328241589832, "loss": 0.0975, "step": 30130 }, { "epoch": 0.76, "learning_rate": 0.001864155968143105, "loss": 0.0911, "step": 30140 }, { "epoch": 0.76, "learning_rate": 0.0018637791121272264, "loss": 0.0977, "step": 30150 }, { "epoch": 0.76, "learning_rate": 0.0018634022561113484, "loss": 0.0958, "step": 30160 }, { "epoch": 0.76, "learning_rate": 0.0018630254000954704, "loss": 0.0987, "step": 30170 }, { "epoch": 0.76, "learning_rate": 0.001862648544079592, "loss": 0.0973, "step": 30180 }, { "epoch": 0.76, "learning_rate": 0.0018622716880637136, "loss": 0.0995, "step": 30190 }, { "epoch": 0.76, "learning_rate": 0.0018618948320478356, "loss": 0.0998, "step": 30200 }, { "epoch": 0.76, "learning_rate": 0.0018615179760319575, "loss": 0.0989, "step": 30210 }, { "epoch": 0.76, "learning_rate": 0.0018611411200160793, "loss": 0.1, "step": 30220 }, { "epoch": 0.76, "learning_rate": 0.001860764264000201, "loss": 0.0991, "step": 30230 }, { "epoch": 0.76, "learning_rate": 0.0018603874079843228, "loss": 0.1011, "step": 30240 }, { "epoch": 0.76, "learning_rate": 0.0018600105519684447, "loss": 0.0989, "step": 30250 }, { "epoch": 0.76, "learning_rate": 0.0018596336959525663, "loss": 0.095, "step": 30260 }, { "epoch": 0.76, "learning_rate": 0.0018592568399366882, "loss": 0.0968, "step": 30270 }, { "epoch": 0.76, "learning_rate": 0.00185887998392081, "loss": 0.0936, "step": 30280 }, { "epoch": 0.76, "learning_rate": 0.001858503127904932, "loss": 0.1002, "step": 30290 }, { "epoch": 0.76, "learning_rate": 0.0018581262718890535, "loss": 0.0974, "step": 30300 }, { "epoch": 0.76, "learning_rate": 0.0018577494158731754, "loss": 0.0954, "step": 30310 }, { "epoch": 0.76, "learning_rate": 0.0018573725598572972, "loss": 0.0954, "step": 30320 }, { "epoch": 0.76, "learning_rate": 0.0018569957038414191, "loss": 0.0983, "step": 30330 }, { "epoch": 0.76, "learning_rate": 0.0018566188478255407, "loss": 0.0978, "step": 30340 }, { "epoch": 0.76, "learning_rate": 0.0018562419918096626, "loss": 0.0994, "step": 30350 }, { "epoch": 0.76, "learning_rate": 0.0018558651357937844, "loss": 0.0974, "step": 30360 }, { "epoch": 0.76, "learning_rate": 0.0018554882797779063, "loss": 0.0952, "step": 30370 }, { "epoch": 0.76, "learning_rate": 0.0018551114237620279, "loss": 0.0938, "step": 30380 }, { "epoch": 0.76, "learning_rate": 0.0018547345677461498, "loss": 0.0971, "step": 30390 }, { "epoch": 0.76, "learning_rate": 0.0018543577117302718, "loss": 0.0995, "step": 30400 }, { "epoch": 0.76, "learning_rate": 0.0018539808557143935, "loss": 0.0957, "step": 30410 }, { "epoch": 0.76, "learning_rate": 0.001853603999698515, "loss": 0.0985, "step": 30420 }, { "epoch": 0.76, "learning_rate": 0.001853227143682637, "loss": 0.0944, "step": 30430 }, { "epoch": 0.76, "learning_rate": 0.001852850287666759, "loss": 0.0984, "step": 30440 }, { "epoch": 0.77, "learning_rate": 0.0018524734316508807, "loss": 0.102, "step": 30450 }, { "epoch": 0.77, "learning_rate": 0.0018520965756350022, "loss": 0.1017, "step": 30460 }, { "epoch": 0.77, "learning_rate": 0.0018517197196191242, "loss": 0.0997, "step": 30470 }, { "epoch": 0.77, "learning_rate": 0.0018513428636032462, "loss": 0.101, "step": 30480 }, { "epoch": 0.77, "learning_rate": 0.0018509660075873677, "loss": 0.098, "step": 30490 }, { "epoch": 0.77, "learning_rate": 0.0018505891515714894, "loss": 0.0958, "step": 30500 }, { "epoch": 0.77, "eval_cer": 0.6662455901255385, "eval_loss": 0.07596764713525772, "eval_runtime": 90.6663, "eval_samples_per_second": 110.283, "eval_steps_per_second": 6.893, "step": 30500 }, { "epoch": 0.77, "learning_rate": 0.0018502122955556114, "loss": 0.0934, "step": 30510 }, { "epoch": 0.77, "learning_rate": 0.0018498354395397334, "loss": 0.0951, "step": 30520 }, { "epoch": 0.77, "learning_rate": 0.0018494585835238549, "loss": 0.0959, "step": 30530 }, { "epoch": 0.77, "learning_rate": 0.0018490817275079769, "loss": 0.1019, "step": 30540 }, { "epoch": 0.77, "learning_rate": 0.0018487048714920986, "loss": 0.0972, "step": 30550 }, { "epoch": 0.77, "learning_rate": 0.0018483280154762206, "loss": 0.0984, "step": 30560 }, { "epoch": 0.77, "learning_rate": 0.001847951159460342, "loss": 0.0973, "step": 30570 }, { "epoch": 0.77, "learning_rate": 0.001847574303444464, "loss": 0.0956, "step": 30580 }, { "epoch": 0.77, "learning_rate": 0.0018471974474285858, "loss": 0.0991, "step": 30590 }, { "epoch": 0.77, "learning_rate": 0.0018468205914127078, "loss": 0.0969, "step": 30600 }, { "epoch": 0.77, "learning_rate": 0.0018464437353968293, "loss": 0.0965, "step": 30610 }, { "epoch": 0.77, "learning_rate": 0.0018460668793809512, "loss": 0.0959, "step": 30620 }, { "epoch": 0.77, "learning_rate": 0.001845690023365073, "loss": 0.0971, "step": 30630 }, { "epoch": 0.77, "learning_rate": 0.001845313167349195, "loss": 0.0962, "step": 30640 }, { "epoch": 0.77, "learning_rate": 0.0018449363113333165, "loss": 0.0977, "step": 30650 }, { "epoch": 0.77, "learning_rate": 0.0018445594553174384, "loss": 0.0941, "step": 30660 }, { "epoch": 0.77, "learning_rate": 0.0018441825993015604, "loss": 0.0981, "step": 30670 }, { "epoch": 0.77, "learning_rate": 0.0018438057432856821, "loss": 0.0967, "step": 30680 }, { "epoch": 0.77, "learning_rate": 0.0018434288872698037, "loss": 0.0981, "step": 30690 }, { "epoch": 0.77, "learning_rate": 0.0018430520312539256, "loss": 0.0969, "step": 30700 }, { "epoch": 0.77, "learning_rate": 0.0018426751752380476, "loss": 0.0967, "step": 30710 }, { "epoch": 0.77, "learning_rate": 0.0018422983192221691, "loss": 0.0952, "step": 30720 }, { "epoch": 0.77, "learning_rate": 0.0018419214632062909, "loss": 0.0993, "step": 30730 }, { "epoch": 0.77, "learning_rate": 0.0018415446071904128, "loss": 0.0953, "step": 30740 }, { "epoch": 0.77, "learning_rate": 0.0018411677511745348, "loss": 0.0968, "step": 30750 }, { "epoch": 0.77, "learning_rate": 0.0018407908951586563, "loss": 0.093, "step": 30760 }, { "epoch": 0.77, "learning_rate": 0.001840414039142778, "loss": 0.0961, "step": 30770 }, { "epoch": 0.77, "learning_rate": 0.0018400371831269, "loss": 0.0961, "step": 30780 }, { "epoch": 0.77, "learning_rate": 0.001839660327111022, "loss": 0.096, "step": 30790 }, { "epoch": 0.77, "learning_rate": 0.0018392834710951435, "loss": 0.0985, "step": 30800 }, { "epoch": 0.77, "learning_rate": 0.0018389066150792655, "loss": 0.0962, "step": 30810 }, { "epoch": 0.77, "learning_rate": 0.0018385297590633872, "loss": 0.0965, "step": 30820 }, { "epoch": 0.77, "learning_rate": 0.0018381529030475092, "loss": 0.0997, "step": 30830 }, { "epoch": 0.77, "learning_rate": 0.0018377760470316307, "loss": 0.1014, "step": 30840 }, { "epoch": 0.78, "learning_rate": 0.0018373991910157527, "loss": 0.0963, "step": 30850 }, { "epoch": 0.78, "learning_rate": 0.0018370223349998744, "loss": 0.096, "step": 30860 }, { "epoch": 0.78, "learning_rate": 0.0018366454789839964, "loss": 0.0979, "step": 30870 }, { "epoch": 0.78, "learning_rate": 0.001836268622968118, "loss": 0.094, "step": 30880 }, { "epoch": 0.78, "learning_rate": 0.0018358917669522399, "loss": 0.095, "step": 30890 }, { "epoch": 0.78, "learning_rate": 0.0018355149109363616, "loss": 0.0946, "step": 30900 }, { "epoch": 0.78, "learning_rate": 0.0018351380549204836, "loss": 0.0967, "step": 30910 }, { "epoch": 0.78, "learning_rate": 0.001834761198904605, "loss": 0.0981, "step": 30920 }, { "epoch": 0.78, "learning_rate": 0.001834384342888727, "loss": 0.0968, "step": 30930 }, { "epoch": 0.78, "learning_rate": 0.0018340074868728488, "loss": 0.0945, "step": 30940 }, { "epoch": 0.78, "learning_rate": 0.0018336306308569706, "loss": 0.0951, "step": 30950 }, { "epoch": 0.78, "learning_rate": 0.0018332537748410923, "loss": 0.0931, "step": 30960 }, { "epoch": 0.78, "learning_rate": 0.0018328769188252143, "loss": 0.0999, "step": 30970 }, { "epoch": 0.78, "learning_rate": 0.0018325000628093362, "loss": 0.0918, "step": 30980 }, { "epoch": 0.78, "learning_rate": 0.0018321232067934577, "loss": 0.0927, "step": 30990 }, { "epoch": 0.78, "learning_rate": 0.0018317463507775795, "loss": 0.0999, "step": 31000 }, { "epoch": 0.78, "eval_cer": 0.6661349071490135, "eval_loss": 0.07599937915802002, "eval_runtime": 90.6874, "eval_samples_per_second": 110.258, "eval_steps_per_second": 6.892, "step": 31000 }, { "epoch": 0.78, "learning_rate": 0.0018313694947617015, "loss": 0.0963, "step": 31010 }, { "epoch": 0.78, "learning_rate": 0.0018309926387458234, "loss": 0.0964, "step": 31020 }, { "epoch": 0.78, "learning_rate": 0.001830615782729945, "loss": 0.0985, "step": 31030 }, { "epoch": 0.78, "learning_rate": 0.0018302389267140667, "loss": 0.0956, "step": 31040 }, { "epoch": 0.78, "learning_rate": 0.0018298620706981886, "loss": 0.0983, "step": 31050 }, { "epoch": 0.78, "learning_rate": 0.0018294852146823106, "loss": 0.0927, "step": 31060 }, { "epoch": 0.78, "learning_rate": 0.0018291083586664321, "loss": 0.0913, "step": 31070 }, { "epoch": 0.78, "learning_rate": 0.001828731502650554, "loss": 0.0932, "step": 31080 }, { "epoch": 0.78, "learning_rate": 0.0018283546466346758, "loss": 0.0954, "step": 31090 }, { "epoch": 0.78, "learning_rate": 0.0018279777906187978, "loss": 0.0978, "step": 31100 }, { "epoch": 0.78, "learning_rate": 0.0018276009346029193, "loss": 0.0953, "step": 31110 }, { "epoch": 0.78, "learning_rate": 0.0018272240785870413, "loss": 0.0969, "step": 31120 }, { "epoch": 0.78, "learning_rate": 0.001826847222571163, "loss": 0.1006, "step": 31130 }, { "epoch": 0.78, "learning_rate": 0.001826470366555285, "loss": 0.0923, "step": 31140 }, { "epoch": 0.78, "learning_rate": 0.0018260935105394065, "loss": 0.0949, "step": 31150 }, { "epoch": 0.78, "learning_rate": 0.0018257166545235285, "loss": 0.0972, "step": 31160 }, { "epoch": 0.78, "learning_rate": 0.0018253397985076502, "loss": 0.0916, "step": 31170 }, { "epoch": 0.78, "learning_rate": 0.0018249629424917718, "loss": 0.0975, "step": 31180 }, { "epoch": 0.78, "learning_rate": 0.0018245860864758937, "loss": 0.0962, "step": 31190 }, { "epoch": 0.78, "learning_rate": 0.0018242092304600157, "loss": 0.0968, "step": 31200 }, { "epoch": 0.78, "learning_rate": 0.0018238323744441374, "loss": 0.097, "step": 31210 }, { "epoch": 0.78, "learning_rate": 0.0018234555184282592, "loss": 0.0965, "step": 31220 }, { "epoch": 0.78, "learning_rate": 0.001823078662412381, "loss": 0.0948, "step": 31230 }, { "epoch": 0.78, "learning_rate": 0.0018227018063965029, "loss": 0.0927, "step": 31240 }, { "epoch": 0.79, "learning_rate": 0.0018223249503806248, "loss": 0.0938, "step": 31250 }, { "epoch": 0.79, "learning_rate": 0.0018219480943647464, "loss": 0.0976, "step": 31260 }, { "epoch": 0.79, "learning_rate": 0.0018215712383488681, "loss": 0.093, "step": 31270 }, { "epoch": 0.79, "learning_rate": 0.00182119438233299, "loss": 0.0961, "step": 31280 }, { "epoch": 0.79, "learning_rate": 0.001820817526317112, "loss": 0.0948, "step": 31290 }, { "epoch": 0.79, "learning_rate": 0.0018204406703012336, "loss": 0.0974, "step": 31300 }, { "epoch": 0.79, "learning_rate": 0.0018200638142853553, "loss": 0.0915, "step": 31310 }, { "epoch": 0.79, "learning_rate": 0.0018196869582694773, "loss": 0.0956, "step": 31320 }, { "epoch": 0.79, "learning_rate": 0.0018193101022535992, "loss": 0.0971, "step": 31330 }, { "epoch": 0.79, "learning_rate": 0.0018189332462377208, "loss": 0.0941, "step": 31340 }, { "epoch": 0.79, "learning_rate": 0.0018185563902218425, "loss": 0.0949, "step": 31350 }, { "epoch": 0.79, "learning_rate": 0.0018181795342059645, "loss": 0.0934, "step": 31360 }, { "epoch": 0.79, "learning_rate": 0.0018178026781900864, "loss": 0.0957, "step": 31370 }, { "epoch": 0.79, "learning_rate": 0.001817425822174208, "loss": 0.0958, "step": 31380 }, { "epoch": 0.79, "learning_rate": 0.00181704896615833, "loss": 0.0965, "step": 31390 }, { "epoch": 0.79, "learning_rate": 0.0018166721101424517, "loss": 0.0956, "step": 31400 }, { "epoch": 0.79, "learning_rate": 0.0018162952541265732, "loss": 0.0972, "step": 31410 }, { "epoch": 0.79, "learning_rate": 0.0018159183981106952, "loss": 0.0995, "step": 31420 }, { "epoch": 0.79, "learning_rate": 0.0018155415420948171, "loss": 0.0925, "step": 31430 }, { "epoch": 0.79, "learning_rate": 0.0018151646860789389, "loss": 0.0944, "step": 31440 }, { "epoch": 0.79, "learning_rate": 0.0018147878300630604, "loss": 0.0914, "step": 31450 }, { "epoch": 0.79, "learning_rate": 0.0018144109740471823, "loss": 0.0953, "step": 31460 }, { "epoch": 0.79, "learning_rate": 0.0018140341180313043, "loss": 0.094, "step": 31470 }, { "epoch": 0.79, "learning_rate": 0.001813657262015426, "loss": 0.0964, "step": 31480 }, { "epoch": 0.79, "learning_rate": 0.0018132804059995478, "loss": 0.0949, "step": 31490 }, { "epoch": 0.79, "learning_rate": 0.0018129035499836695, "loss": 0.0953, "step": 31500 }, { "epoch": 0.79, "eval_cer": 0.6660814905820818, "eval_loss": 0.07518129050731659, "eval_runtime": 90.6489, "eval_samples_per_second": 110.305, "eval_steps_per_second": 6.895, "step": 31500 }, { "epoch": 0.79, "learning_rate": 0.0018125266939677915, "loss": 0.0923, "step": 31510 }, { "epoch": 0.79, "learning_rate": 0.0018121498379519132, "loss": 0.1015, "step": 31520 }, { "epoch": 0.79, "learning_rate": 0.001811772981936035, "loss": 0.0961, "step": 31530 }, { "epoch": 0.79, "learning_rate": 0.0018113961259201567, "loss": 0.0955, "step": 31540 }, { "epoch": 0.79, "learning_rate": 0.0018110192699042787, "loss": 0.0983, "step": 31550 }, { "epoch": 0.79, "learning_rate": 0.0018106424138884007, "loss": 0.0977, "step": 31560 }, { "epoch": 0.79, "learning_rate": 0.0018102655578725222, "loss": 0.0982, "step": 31570 }, { "epoch": 0.79, "learning_rate": 0.001809888701856644, "loss": 0.0937, "step": 31580 }, { "epoch": 0.79, "learning_rate": 0.001809511845840766, "loss": 0.0956, "step": 31590 }, { "epoch": 0.79, "learning_rate": 0.0018091349898248874, "loss": 0.0955, "step": 31600 }, { "epoch": 0.79, "learning_rate": 0.0018087581338090094, "loss": 0.0926, "step": 31610 }, { "epoch": 0.79, "learning_rate": 0.0018083812777931311, "loss": 0.0961, "step": 31620 }, { "epoch": 0.79, "learning_rate": 0.001808004421777253, "loss": 0.0952, "step": 31630 }, { "epoch": 0.79, "learning_rate": 0.0018076275657613746, "loss": 0.0969, "step": 31640 }, { "epoch": 0.8, "learning_rate": 0.0018072507097454966, "loss": 0.0995, "step": 31650 }, { "epoch": 0.8, "learning_rate": 0.0018068738537296185, "loss": 0.0956, "step": 31660 }, { "epoch": 0.8, "learning_rate": 0.0018064969977137403, "loss": 0.0951, "step": 31670 }, { "epoch": 0.8, "learning_rate": 0.0018061201416978618, "loss": 0.099, "step": 31680 }, { "epoch": 0.8, "learning_rate": 0.0018057432856819838, "loss": 0.0959, "step": 31690 }, { "epoch": 0.8, "learning_rate": 0.0018053664296661057, "loss": 0.0974, "step": 31700 }, { "epoch": 0.8, "learning_rate": 0.0018049895736502275, "loss": 0.0936, "step": 31710 }, { "epoch": 0.8, "learning_rate": 0.001804612717634349, "loss": 0.0978, "step": 31720 }, { "epoch": 0.8, "learning_rate": 0.001804235861618471, "loss": 0.096, "step": 31730 }, { "epoch": 0.8, "learning_rate": 0.001803859005602593, "loss": 0.0995, "step": 31740 }, { "epoch": 0.8, "learning_rate": 0.0018034821495867147, "loss": 0.0954, "step": 31750 }, { "epoch": 0.8, "learning_rate": 0.0018031052935708362, "loss": 0.0929, "step": 31760 }, { "epoch": 0.8, "learning_rate": 0.0018027284375549582, "loss": 0.093, "step": 31770 }, { "epoch": 0.8, "learning_rate": 0.0018023515815390801, "loss": 0.0933, "step": 31780 }, { "epoch": 0.8, "learning_rate": 0.0018019747255232019, "loss": 0.0939, "step": 31790 }, { "epoch": 0.8, "learning_rate": 0.0018015978695073236, "loss": 0.0916, "step": 31800 }, { "epoch": 0.8, "learning_rate": 0.0018012210134914454, "loss": 0.0982, "step": 31810 }, { "epoch": 0.8, "learning_rate": 0.0018008441574755673, "loss": 0.093, "step": 31820 }, { "epoch": 0.8, "learning_rate": 0.0018004673014596888, "loss": 0.0967, "step": 31830 }, { "epoch": 0.8, "learning_rate": 0.0018000904454438108, "loss": 0.0949, "step": 31840 }, { "epoch": 0.8, "learning_rate": 0.0017997135894279326, "loss": 0.0948, "step": 31850 }, { "epoch": 0.8, "learning_rate": 0.0017993367334120545, "loss": 0.0965, "step": 31860 }, { "epoch": 0.8, "learning_rate": 0.001798959877396176, "loss": 0.0951, "step": 31870 }, { "epoch": 0.8, "learning_rate": 0.001798583021380298, "loss": 0.1012, "step": 31880 }, { "epoch": 0.8, "learning_rate": 0.0017982061653644198, "loss": 0.0969, "step": 31890 }, { "epoch": 0.8, "learning_rate": 0.0017978293093485417, "loss": 0.095, "step": 31900 }, { "epoch": 0.8, "learning_rate": 0.0017974524533326632, "loss": 0.0935, "step": 31910 }, { "epoch": 0.8, "learning_rate": 0.0017970755973167852, "loss": 0.0951, "step": 31920 }, { "epoch": 0.8, "learning_rate": 0.001796698741300907, "loss": 0.0974, "step": 31930 }, { "epoch": 0.8, "learning_rate": 0.001796321885285029, "loss": 0.0941, "step": 31940 }, { "epoch": 0.8, "learning_rate": 0.0017959450292691504, "loss": 0.0965, "step": 31950 }, { "epoch": 0.8, "learning_rate": 0.0017955681732532724, "loss": 0.0939, "step": 31960 }, { "epoch": 0.8, "learning_rate": 0.0017951913172373944, "loss": 0.0975, "step": 31970 }, { "epoch": 0.8, "learning_rate": 0.001794814461221516, "loss": 0.0947, "step": 31980 }, { "epoch": 0.8, "learning_rate": 0.0017944376052056376, "loss": 0.0963, "step": 31990 }, { "epoch": 0.8, "learning_rate": 0.0017940607491897596, "loss": 0.095, "step": 32000 }, { "epoch": 0.8, "eval_cer": 0.6662220098392354, "eval_loss": 0.07489816099405289, "eval_runtime": 90.5954, "eval_samples_per_second": 110.37, "eval_steps_per_second": 6.899, "step": 32000 }, { "epoch": 0.8, "learning_rate": 0.0017936838931738816, "loss": 0.0966, "step": 32010 }, { "epoch": 0.8, "learning_rate": 0.0017933070371580033, "loss": 0.096, "step": 32020 }, { "epoch": 0.8, "learning_rate": 0.0017929301811421248, "loss": 0.0933, "step": 32030 }, { "epoch": 0.8, "learning_rate": 0.0017925533251262468, "loss": 0.0946, "step": 32040 }, { "epoch": 0.81, "learning_rate": 0.0017921764691103687, "loss": 0.0965, "step": 32050 }, { "epoch": 0.81, "learning_rate": 0.0017917996130944903, "loss": 0.0956, "step": 32060 }, { "epoch": 0.81, "learning_rate": 0.0017914227570786122, "loss": 0.0931, "step": 32070 }, { "epoch": 0.81, "learning_rate": 0.001791045901062734, "loss": 0.0952, "step": 32080 }, { "epoch": 0.81, "learning_rate": 0.001790669045046856, "loss": 0.0952, "step": 32090 }, { "epoch": 0.81, "learning_rate": 0.0017902921890309775, "loss": 0.0916, "step": 32100 }, { "epoch": 0.81, "learning_rate": 0.0017899153330150994, "loss": 0.0926, "step": 32110 }, { "epoch": 0.81, "learning_rate": 0.0017895384769992212, "loss": 0.1009, "step": 32120 }, { "epoch": 0.81, "learning_rate": 0.0017891616209833431, "loss": 0.0927, "step": 32130 }, { "epoch": 0.81, "learning_rate": 0.0017887847649674647, "loss": 0.0993, "step": 32140 }, { "epoch": 0.81, "learning_rate": 0.0017884079089515866, "loss": 0.0974, "step": 32150 }, { "epoch": 0.81, "learning_rate": 0.0017880310529357084, "loss": 0.0937, "step": 32160 }, { "epoch": 0.81, "learning_rate": 0.0017876541969198303, "loss": 0.0957, "step": 32170 }, { "epoch": 0.81, "learning_rate": 0.0017872773409039519, "loss": 0.095, "step": 32180 }, { "epoch": 0.81, "learning_rate": 0.0017869004848880738, "loss": 0.095, "step": 32190 }, { "epoch": 0.81, "learning_rate": 0.0017865236288721956, "loss": 0.0979, "step": 32200 }, { "epoch": 0.81, "learning_rate": 0.0017861467728563175, "loss": 0.0903, "step": 32210 }, { "epoch": 0.81, "learning_rate": 0.001785769916840439, "loss": 0.0944, "step": 32220 }, { "epoch": 0.81, "learning_rate": 0.001785393060824561, "loss": 0.0943, "step": 32230 }, { "epoch": 0.81, "learning_rate": 0.001785016204808683, "loss": 0.0986, "step": 32240 }, { "epoch": 0.81, "learning_rate": 0.0017846393487928047, "loss": 0.0931, "step": 32250 }, { "epoch": 0.81, "learning_rate": 0.0017842624927769263, "loss": 0.0915, "step": 32260 }, { "epoch": 0.81, "learning_rate": 0.0017838856367610482, "loss": 0.0935, "step": 32270 }, { "epoch": 0.81, "learning_rate": 0.0017835087807451702, "loss": 0.0938, "step": 32280 }, { "epoch": 0.81, "learning_rate": 0.0017831319247292917, "loss": 0.0942, "step": 32290 }, { "epoch": 0.81, "learning_rate": 0.0017827550687134134, "loss": 0.0977, "step": 32300 }, { "epoch": 0.81, "learning_rate": 0.0017823782126975354, "loss": 0.0938, "step": 32310 }, { "epoch": 0.81, "learning_rate": 0.0017820013566816574, "loss": 0.0961, "step": 32320 }, { "epoch": 0.81, "learning_rate": 0.001781624500665779, "loss": 0.0929, "step": 32330 }, { "epoch": 0.81, "learning_rate": 0.0017812476446499006, "loss": 0.0904, "step": 32340 }, { "epoch": 0.81, "learning_rate": 0.0017808707886340226, "loss": 0.0981, "step": 32350 }, { "epoch": 0.81, "learning_rate": 0.0017804939326181446, "loss": 0.0945, "step": 32360 }, { "epoch": 0.81, "learning_rate": 0.001780117076602266, "loss": 0.0971, "step": 32370 }, { "epoch": 0.81, "learning_rate": 0.001779740220586388, "loss": 0.0965, "step": 32380 }, { "epoch": 0.81, "learning_rate": 0.0017793633645705098, "loss": 0.0958, "step": 32390 }, { "epoch": 0.81, "learning_rate": 0.0017789865085546318, "loss": 0.099, "step": 32400 }, { "epoch": 0.81, "learning_rate": 0.0017786096525387533, "loss": 0.0947, "step": 32410 }, { "epoch": 0.81, "learning_rate": 0.0017782327965228753, "loss": 0.0964, "step": 32420 }, { "epoch": 0.81, "learning_rate": 0.001777855940506997, "loss": 0.103, "step": 32430 }, { "epoch": 0.82, "learning_rate": 0.001777479084491119, "loss": 0.0953, "step": 32440 }, { "epoch": 0.82, "learning_rate": 0.0017771022284752405, "loss": 0.0934, "step": 32450 }, { "epoch": 0.82, "learning_rate": 0.0017767253724593624, "loss": 0.0963, "step": 32460 }, { "epoch": 0.82, "learning_rate": 0.0017763485164434842, "loss": 0.0929, "step": 32470 }, { "epoch": 0.82, "learning_rate": 0.0017759716604276062, "loss": 0.0949, "step": 32480 }, { "epoch": 0.82, "learning_rate": 0.0017755948044117277, "loss": 0.0952, "step": 32490 }, { "epoch": 0.82, "learning_rate": 0.0017752179483958496, "loss": 0.09, "step": 32500 }, { "epoch": 0.82, "eval_cer": 0.6662576208838565, "eval_loss": 0.07475540041923523, "eval_runtime": 90.7185, "eval_samples_per_second": 110.22, "eval_steps_per_second": 6.889, "step": 32500 }, { "epoch": 0.82, "learning_rate": 0.0017748410923799714, "loss": 0.0996, "step": 32510 }, { "epoch": 0.82, "learning_rate": 0.0017744642363640931, "loss": 0.0974, "step": 32520 }, { "epoch": 0.82, "learning_rate": 0.0017740873803482149, "loss": 0.0936, "step": 32530 }, { "epoch": 0.82, "learning_rate": 0.0017737105243323368, "loss": 0.0976, "step": 32540 }, { "epoch": 0.82, "learning_rate": 0.0017733336683164588, "loss": 0.0948, "step": 32550 }, { "epoch": 0.82, "learning_rate": 0.0017729568123005803, "loss": 0.0954, "step": 32560 }, { "epoch": 0.82, "learning_rate": 0.001772579956284702, "loss": 0.0959, "step": 32570 }, { "epoch": 0.82, "learning_rate": 0.001772203100268824, "loss": 0.0974, "step": 32580 }, { "epoch": 0.82, "learning_rate": 0.001771826244252946, "loss": 0.0967, "step": 32590 }, { "epoch": 0.82, "learning_rate": 0.0017714493882370675, "loss": 0.0929, "step": 32600 }, { "epoch": 0.82, "learning_rate": 0.0017710725322211893, "loss": 0.0947, "step": 32610 }, { "epoch": 0.82, "learning_rate": 0.0017706956762053112, "loss": 0.0964, "step": 32620 }, { "epoch": 0.82, "learning_rate": 0.0017703188201894332, "loss": 0.0929, "step": 32630 }, { "epoch": 0.82, "learning_rate": 0.0017699419641735547, "loss": 0.091, "step": 32640 }, { "epoch": 0.82, "learning_rate": 0.0017695651081576767, "loss": 0.0927, "step": 32650 }, { "epoch": 0.82, "learning_rate": 0.0017691882521417984, "loss": 0.0942, "step": 32660 }, { "epoch": 0.82, "learning_rate": 0.0017688113961259204, "loss": 0.0924, "step": 32670 }, { "epoch": 0.82, "learning_rate": 0.001768434540110042, "loss": 0.0967, "step": 32680 }, { "epoch": 0.82, "learning_rate": 0.0017680576840941639, "loss": 0.0936, "step": 32690 }, { "epoch": 0.82, "learning_rate": 0.0017676808280782856, "loss": 0.0964, "step": 32700 }, { "epoch": 0.82, "learning_rate": 0.0017673039720624071, "loss": 0.0944, "step": 32710 }, { "epoch": 0.82, "learning_rate": 0.001766927116046529, "loss": 0.0932, "step": 32720 }, { "epoch": 0.82, "learning_rate": 0.001766550260030651, "loss": 0.0894, "step": 32730 }, { "epoch": 0.82, "learning_rate": 0.0017661734040147728, "loss": 0.0946, "step": 32740 }, { "epoch": 0.82, "learning_rate": 0.0017657965479988943, "loss": 0.0945, "step": 32750 }, { "epoch": 0.82, "learning_rate": 0.0017654196919830163, "loss": 0.0966, "step": 32760 }, { "epoch": 0.82, "learning_rate": 0.0017650428359671383, "loss": 0.0972, "step": 32770 }, { "epoch": 0.82, "learning_rate": 0.00176466597995126, "loss": 0.0925, "step": 32780 }, { "epoch": 0.82, "learning_rate": 0.0017642891239353818, "loss": 0.097, "step": 32790 }, { "epoch": 0.82, "learning_rate": 0.0017639122679195035, "loss": 0.0931, "step": 32800 }, { "epoch": 0.82, "learning_rate": 0.0017635354119036255, "loss": 0.0914, "step": 32810 }, { "epoch": 0.82, "learning_rate": 0.0017631585558877474, "loss": 0.0939, "step": 32820 }, { "epoch": 0.82, "learning_rate": 0.001762781699871869, "loss": 0.0944, "step": 32830 }, { "epoch": 0.83, "learning_rate": 0.0017624048438559907, "loss": 0.0913, "step": 32840 }, { "epoch": 0.83, "learning_rate": 0.0017620279878401127, "loss": 0.0939, "step": 32850 }, { "epoch": 0.83, "learning_rate": 0.0017616511318242346, "loss": 0.0938, "step": 32860 }, { "epoch": 0.83, "learning_rate": 0.0017612742758083561, "loss": 0.0922, "step": 32870 }, { "epoch": 0.83, "learning_rate": 0.0017608974197924779, "loss": 0.097, "step": 32880 }, { "epoch": 0.83, "learning_rate": 0.0017605205637765999, "loss": 0.0948, "step": 32890 }, { "epoch": 0.83, "learning_rate": 0.0017601437077607218, "loss": 0.0952, "step": 32900 }, { "epoch": 0.83, "learning_rate": 0.0017597668517448433, "loss": 0.0958, "step": 32910 }, { "epoch": 0.83, "learning_rate": 0.001759389995728965, "loss": 0.0936, "step": 32920 }, { "epoch": 0.83, "learning_rate": 0.001759013139713087, "loss": 0.0942, "step": 32930 }, { "epoch": 0.83, "learning_rate": 0.0017586362836972086, "loss": 0.0982, "step": 32940 }, { "epoch": 0.83, "learning_rate": 0.0017582594276813305, "loss": 0.0943, "step": 32950 }, { "epoch": 0.83, "learning_rate": 0.0017578825716654525, "loss": 0.0946, "step": 32960 }, { "epoch": 0.83, "learning_rate": 0.0017575057156495742, "loss": 0.095, "step": 32970 }, { "epoch": 0.83, "learning_rate": 0.0017571288596336958, "loss": 0.093, "step": 32980 }, { "epoch": 0.83, "learning_rate": 0.0017567520036178177, "loss": 0.0948, "step": 32990 }, { "epoch": 0.83, "learning_rate": 0.0017563751476019397, "loss": 0.0927, "step": 33000 }, { "epoch": 0.83, "eval_cer": 0.6656248029963325, "eval_loss": 0.07400975376367569, "eval_runtime": 90.819, "eval_samples_per_second": 110.098, "eval_steps_per_second": 6.882, "step": 33000 }, { "epoch": 0.83, "learning_rate": 0.0017559982915860614, "loss": 0.0909, "step": 33010 }, { "epoch": 0.83, "learning_rate": 0.001755621435570183, "loss": 0.0924, "step": 33020 }, { "epoch": 0.83, "learning_rate": 0.001755244579554305, "loss": 0.0877, "step": 33030 }, { "epoch": 0.83, "learning_rate": 0.0017548677235384269, "loss": 0.0936, "step": 33040 }, { "epoch": 0.83, "learning_rate": 0.0017544908675225486, "loss": 0.0929, "step": 33050 }, { "epoch": 0.83, "learning_rate": 0.0017541140115066704, "loss": 0.0943, "step": 33060 }, { "epoch": 0.83, "learning_rate": 0.0017537371554907921, "loss": 0.0924, "step": 33070 }, { "epoch": 0.83, "learning_rate": 0.001753360299474914, "loss": 0.0967, "step": 33080 }, { "epoch": 0.83, "learning_rate": 0.0017529834434590358, "loss": 0.0918, "step": 33090 }, { "epoch": 0.83, "learning_rate": 0.0017526065874431576, "loss": 0.094, "step": 33100 }, { "epoch": 0.83, "learning_rate": 0.0017522297314272793, "loss": 0.0924, "step": 33110 }, { "epoch": 0.83, "learning_rate": 0.0017518528754114013, "loss": 0.0933, "step": 33120 }, { "epoch": 0.83, "learning_rate": 0.0017514760193955232, "loss": 0.0937, "step": 33130 }, { "epoch": 0.83, "learning_rate": 0.0017510991633796448, "loss": 0.0909, "step": 33140 }, { "epoch": 0.83, "learning_rate": 0.0017507223073637665, "loss": 0.0945, "step": 33150 }, { "epoch": 0.83, "learning_rate": 0.0017503454513478885, "loss": 0.0906, "step": 33160 }, { "epoch": 0.83, "learning_rate": 0.00174996859533201, "loss": 0.0962, "step": 33170 }, { "epoch": 0.83, "learning_rate": 0.001749591739316132, "loss": 0.091, "step": 33180 }, { "epoch": 0.83, "learning_rate": 0.0017492148833002537, "loss": 0.0924, "step": 33190 }, { "epoch": 0.83, "learning_rate": 0.0017488380272843757, "loss": 0.0909, "step": 33200 }, { "epoch": 0.83, "learning_rate": 0.0017484611712684972, "loss": 0.0921, "step": 33210 }, { "epoch": 0.83, "learning_rate": 0.0017480843152526192, "loss": 0.09, "step": 33220 }, { "epoch": 0.83, "learning_rate": 0.0017477074592367411, "loss": 0.0988, "step": 33230 }, { "epoch": 0.84, "learning_rate": 0.0017473306032208629, "loss": 0.0931, "step": 33240 }, { "epoch": 0.84, "learning_rate": 0.0017469537472049844, "loss": 0.0974, "step": 33250 }, { "epoch": 0.84, "learning_rate": 0.0017465768911891064, "loss": 0.0907, "step": 33260 }, { "epoch": 0.84, "learning_rate": 0.0017462000351732283, "loss": 0.0921, "step": 33270 }, { "epoch": 0.84, "learning_rate": 0.00174582317915735, "loss": 0.094, "step": 33280 }, { "epoch": 0.84, "learning_rate": 0.0017454463231414716, "loss": 0.091, "step": 33290 }, { "epoch": 0.84, "learning_rate": 0.0017450694671255935, "loss": 0.0906, "step": 33300 }, { "epoch": 0.84, "learning_rate": 0.0017446926111097155, "loss": 0.0884, "step": 33310 }, { "epoch": 0.84, "learning_rate": 0.0017443157550938373, "loss": 0.0916, "step": 33320 }, { "epoch": 0.84, "learning_rate": 0.0017439388990779588, "loss": 0.0951, "step": 33330 }, { "epoch": 0.84, "learning_rate": 0.0017435620430620807, "loss": 0.0937, "step": 33340 }, { "epoch": 0.84, "learning_rate": 0.0017431851870462027, "loss": 0.0922, "step": 33350 }, { "epoch": 0.84, "learning_rate": 0.0017428083310303245, "loss": 0.0923, "step": 33360 }, { "epoch": 0.84, "learning_rate": 0.0017424314750144462, "loss": 0.0941, "step": 33370 }, { "epoch": 0.84, "learning_rate": 0.001742054618998568, "loss": 0.0932, "step": 33380 }, { "epoch": 0.84, "learning_rate": 0.00174167776298269, "loss": 0.0934, "step": 33390 }, { "epoch": 0.84, "learning_rate": 0.0017413009069668114, "loss": 0.095, "step": 33400 }, { "epoch": 0.84, "learning_rate": 0.0017409240509509334, "loss": 0.0925, "step": 33410 }, { "epoch": 0.84, "learning_rate": 0.0017405471949350551, "loss": 0.0933, "step": 33420 }, { "epoch": 0.84, "learning_rate": 0.001740170338919177, "loss": 0.0931, "step": 33430 }, { "epoch": 0.84, "learning_rate": 0.0017397934829032986, "loss": 0.0936, "step": 33440 }, { "epoch": 0.84, "learning_rate": 0.0017394166268874206, "loss": 0.0896, "step": 33450 }, { "epoch": 0.84, "learning_rate": 0.0017390397708715423, "loss": 0.0935, "step": 33460 }, { "epoch": 0.84, "learning_rate": 0.0017386629148556643, "loss": 0.0955, "step": 33470 }, { "epoch": 0.84, "learning_rate": 0.0017382860588397858, "loss": 0.0952, "step": 33480 }, { "epoch": 0.84, "learning_rate": 0.0017379092028239078, "loss": 0.0954, "step": 33490 }, { "epoch": 0.84, "learning_rate": 0.0017375323468080295, "loss": 0.0914, "step": 33500 }, { "epoch": 0.84, "eval_cer": 0.6662003544742631, "eval_loss": 0.07387839257717133, "eval_runtime": 90.756, "eval_samples_per_second": 110.175, "eval_steps_per_second": 6.887, "step": 33500 }, { "epoch": 0.84, "learning_rate": 0.0017371554907921515, "loss": 0.094, "step": 33510 }, { "epoch": 0.84, "learning_rate": 0.001736778634776273, "loss": 0.091, "step": 33520 }, { "epoch": 0.84, "learning_rate": 0.001736401778760395, "loss": 0.09, "step": 33530 }, { "epoch": 0.84, "learning_rate": 0.001736024922744517, "loss": 0.0934, "step": 33540 }, { "epoch": 0.84, "learning_rate": 0.0017356480667286387, "loss": 0.0958, "step": 33550 }, { "epoch": 0.84, "learning_rate": 0.0017352712107127602, "loss": 0.0926, "step": 33560 }, { "epoch": 0.84, "learning_rate": 0.0017348943546968822, "loss": 0.0905, "step": 33570 }, { "epoch": 0.84, "learning_rate": 0.0017345174986810041, "loss": 0.0919, "step": 33580 }, { "epoch": 0.84, "learning_rate": 0.0017341406426651259, "loss": 0.0964, "step": 33590 }, { "epoch": 0.84, "learning_rate": 0.0017337637866492474, "loss": 0.0949, "step": 33600 }, { "epoch": 0.84, "learning_rate": 0.0017333869306333694, "loss": 0.09, "step": 33610 }, { "epoch": 0.84, "learning_rate": 0.0017330100746174913, "loss": 0.091, "step": 33620 }, { "epoch": 0.84, "learning_rate": 0.0017326332186016129, "loss": 0.0972, "step": 33630 }, { "epoch": 0.85, "learning_rate": 0.0017322563625857348, "loss": 0.0954, "step": 33640 }, { "epoch": 0.85, "learning_rate": 0.0017318795065698566, "loss": 0.095, "step": 33650 }, { "epoch": 0.85, "learning_rate": 0.0017315026505539785, "loss": 0.0931, "step": 33660 }, { "epoch": 0.85, "learning_rate": 0.0017311257945381, "loss": 0.0932, "step": 33670 }, { "epoch": 0.85, "learning_rate": 0.001730748938522222, "loss": 0.0919, "step": 33680 }, { "epoch": 0.85, "learning_rate": 0.0017303720825063438, "loss": 0.089, "step": 33690 }, { "epoch": 0.85, "learning_rate": 0.0017299952264904657, "loss": 0.0972, "step": 33700 }, { "epoch": 0.85, "learning_rate": 0.0017296183704745872, "loss": 0.0916, "step": 33710 }, { "epoch": 0.85, "learning_rate": 0.0017292415144587092, "loss": 0.0878, "step": 33720 }, { "epoch": 0.85, "learning_rate": 0.001728864658442831, "loss": 0.0971, "step": 33730 }, { "epoch": 0.85, "learning_rate": 0.001728487802426953, "loss": 0.0936, "step": 33740 }, { "epoch": 0.85, "learning_rate": 0.0017281109464110744, "loss": 0.0936, "step": 33750 }, { "epoch": 0.85, "learning_rate": 0.0017277340903951964, "loss": 0.0947, "step": 33760 }, { "epoch": 0.85, "learning_rate": 0.0017273572343793181, "loss": 0.0947, "step": 33770 }, { "epoch": 0.85, "learning_rate": 0.0017269803783634401, "loss": 0.091, "step": 33780 }, { "epoch": 0.85, "learning_rate": 0.0017266035223475616, "loss": 0.0943, "step": 33790 }, { "epoch": 0.85, "learning_rate": 0.0017262266663316836, "loss": 0.0911, "step": 33800 }, { "epoch": 0.85, "learning_rate": 0.0017258498103158056, "loss": 0.0921, "step": 33810 }, { "epoch": 0.85, "learning_rate": 0.001725472954299927, "loss": 0.0895, "step": 33820 }, { "epoch": 0.85, "learning_rate": 0.0017250960982840488, "loss": 0.093, "step": 33830 }, { "epoch": 0.85, "learning_rate": 0.0017247192422681708, "loss": 0.0933, "step": 33840 }, { "epoch": 0.85, "learning_rate": 0.0017243423862522928, "loss": 0.0962, "step": 33850 }, { "epoch": 0.85, "learning_rate": 0.0017239655302364143, "loss": 0.095, "step": 33860 }, { "epoch": 0.85, "learning_rate": 0.001723588674220536, "loss": 0.0909, "step": 33870 }, { "epoch": 0.85, "learning_rate": 0.001723211818204658, "loss": 0.0924, "step": 33880 }, { "epoch": 0.85, "learning_rate": 0.00172283496218878, "loss": 0.0895, "step": 33890 }, { "epoch": 0.85, "learning_rate": 0.0017224581061729015, "loss": 0.0909, "step": 33900 }, { "epoch": 0.85, "learning_rate": 0.0017220812501570232, "loss": 0.0938, "step": 33910 }, { "epoch": 0.85, "learning_rate": 0.0017217043941411452, "loss": 0.0934, "step": 33920 }, { "epoch": 0.85, "learning_rate": 0.0017213275381252671, "loss": 0.0947, "step": 33930 }, { "epoch": 0.85, "learning_rate": 0.0017209506821093887, "loss": 0.0933, "step": 33940 }, { "epoch": 0.85, "learning_rate": 0.0017205738260935106, "loss": 0.0956, "step": 33950 }, { "epoch": 0.85, "learning_rate": 0.0017201969700776324, "loss": 0.0919, "step": 33960 }, { "epoch": 0.85, "learning_rate": 0.0017198201140617543, "loss": 0.0962, "step": 33970 }, { "epoch": 0.85, "learning_rate": 0.0017194432580458759, "loss": 0.0935, "step": 33980 }, { "epoch": 0.85, "learning_rate": 0.0017190664020299978, "loss": 0.0932, "step": 33990 }, { "epoch": 0.85, "learning_rate": 0.0017186895460141196, "loss": 0.0889, "step": 34000 }, { "epoch": 0.85, "eval_cer": 0.665936159021601, "eval_loss": 0.07373498380184174, "eval_runtime": 90.8685, "eval_samples_per_second": 110.038, "eval_steps_per_second": 6.878, "step": 34000 }, { "epoch": 0.85, "learning_rate": 0.0017183126899982415, "loss": 0.0922, "step": 34010 }, { "epoch": 0.85, "learning_rate": 0.001717935833982363, "loss": 0.0928, "step": 34020 }, { "epoch": 0.85, "learning_rate": 0.001717558977966485, "loss": 0.0973, "step": 34030 }, { "epoch": 0.86, "learning_rate": 0.0017171821219506068, "loss": 0.092, "step": 34040 }, { "epoch": 0.86, "learning_rate": 0.0017168052659347285, "loss": 0.0924, "step": 34050 }, { "epoch": 0.86, "learning_rate": 0.0017164284099188503, "loss": 0.0968, "step": 34060 }, { "epoch": 0.86, "learning_rate": 0.0017160515539029722, "loss": 0.095, "step": 34070 }, { "epoch": 0.86, "learning_rate": 0.001715674697887094, "loss": 0.0928, "step": 34080 }, { "epoch": 0.86, "learning_rate": 0.0017152978418712157, "loss": 0.0945, "step": 34090 }, { "epoch": 0.86, "learning_rate": 0.0017149209858553375, "loss": 0.0929, "step": 34100 }, { "epoch": 0.86, "learning_rate": 0.0017145441298394594, "loss": 0.0899, "step": 34110 }, { "epoch": 0.86, "learning_rate": 0.0017141672738235814, "loss": 0.0887, "step": 34120 }, { "epoch": 0.86, "learning_rate": 0.001713790417807703, "loss": 0.0915, "step": 34130 }, { "epoch": 0.86, "learning_rate": 0.0017134135617918247, "loss": 0.0945, "step": 34140 }, { "epoch": 0.86, "learning_rate": 0.0017130367057759466, "loss": 0.0913, "step": 34150 }, { "epoch": 0.86, "learning_rate": 0.0017126598497600686, "loss": 0.0915, "step": 34160 }, { "epoch": 0.86, "learning_rate": 0.00171228299374419, "loss": 0.0951, "step": 34170 }, { "epoch": 0.86, "learning_rate": 0.0017119061377283118, "loss": 0.0959, "step": 34180 }, { "epoch": 0.86, "learning_rate": 0.0017115292817124338, "loss": 0.0957, "step": 34190 }, { "epoch": 0.86, "learning_rate": 0.0017111524256965558, "loss": 0.0911, "step": 34200 }, { "epoch": 0.86, "learning_rate": 0.0017107755696806773, "loss": 0.0934, "step": 34210 }, { "epoch": 0.86, "learning_rate": 0.0017103987136647993, "loss": 0.0918, "step": 34220 }, { "epoch": 0.86, "learning_rate": 0.001710021857648921, "loss": 0.0925, "step": 34230 }, { "epoch": 0.86, "learning_rate": 0.001709645001633043, "loss": 0.0916, "step": 34240 }, { "epoch": 0.86, "learning_rate": 0.0017092681456171645, "loss": 0.0907, "step": 34250 }, { "epoch": 0.86, "learning_rate": 0.0017088912896012865, "loss": 0.0905, "step": 34260 }, { "epoch": 0.86, "learning_rate": 0.0017085144335854082, "loss": 0.0933, "step": 34270 }, { "epoch": 0.86, "learning_rate": 0.0017081375775695297, "loss": 0.0923, "step": 34280 }, { "epoch": 0.86, "learning_rate": 0.0017077607215536517, "loss": 0.0953, "step": 34290 }, { "epoch": 0.86, "learning_rate": 0.0017073838655377736, "loss": 0.0925, "step": 34300 }, { "epoch": 0.86, "learning_rate": 0.0017070070095218954, "loss": 0.092, "step": 34310 }, { "epoch": 0.86, "learning_rate": 0.001706630153506017, "loss": 0.094, "step": 34320 }, { "epoch": 0.86, "learning_rate": 0.0017062532974901389, "loss": 0.0938, "step": 34330 }, { "epoch": 0.86, "learning_rate": 0.0017058764414742608, "loss": 0.0876, "step": 34340 }, { "epoch": 0.86, "learning_rate": 0.0017054995854583826, "loss": 0.0927, "step": 34350 }, { "epoch": 0.86, "learning_rate": 0.0017051227294425043, "loss": 0.0946, "step": 34360 }, { "epoch": 0.86, "learning_rate": 0.001704745873426626, "loss": 0.0934, "step": 34370 }, { "epoch": 0.86, "learning_rate": 0.001704369017410748, "loss": 0.0908, "step": 34380 }, { "epoch": 0.86, "learning_rate": 0.00170399216139487, "loss": 0.0909, "step": 34390 }, { "epoch": 0.86, "learning_rate": 0.0017036153053789915, "loss": 0.0901, "step": 34400 }, { "epoch": 0.86, "learning_rate": 0.0017032384493631133, "loss": 0.0888, "step": 34410 }, { "epoch": 0.86, "learning_rate": 0.0017028615933472352, "loss": 0.0895, "step": 34420 }, { "epoch": 0.86, "learning_rate": 0.0017024847373313572, "loss": 0.0867, "step": 34430 }, { "epoch": 0.87, "learning_rate": 0.0017021078813154787, "loss": 0.0912, "step": 34440 }, { "epoch": 0.87, "learning_rate": 0.0017017310252996005, "loss": 0.0906, "step": 34450 }, { "epoch": 0.87, "learning_rate": 0.0017013541692837224, "loss": 0.0943, "step": 34460 }, { "epoch": 0.87, "learning_rate": 0.0017009773132678444, "loss": 0.0911, "step": 34470 }, { "epoch": 0.87, "learning_rate": 0.001700600457251966, "loss": 0.0914, "step": 34480 }, { "epoch": 0.87, "learning_rate": 0.0017002236012360877, "loss": 0.0936, "step": 34490 }, { "epoch": 0.87, "learning_rate": 0.0016998467452202096, "loss": 0.0924, "step": 34500 }, { "epoch": 0.87, "eval_cer": 0.6659621454595678, "eval_loss": 0.0725727379322052, "eval_runtime": 90.8863, "eval_samples_per_second": 110.017, "eval_steps_per_second": 6.877, "step": 34500 }, { "epoch": 0.87, "learning_rate": 0.0016994698892043312, "loss": 0.0938, "step": 34510 }, { "epoch": 0.87, "learning_rate": 0.0016990930331884531, "loss": 0.0948, "step": 34520 }, { "epoch": 0.87, "learning_rate": 0.001698716177172575, "loss": 0.0885, "step": 34530 }, { "epoch": 0.87, "learning_rate": 0.0016983393211566968, "loss": 0.0896, "step": 34540 }, { "epoch": 0.87, "learning_rate": 0.0016979624651408183, "loss": 0.0916, "step": 34550 }, { "epoch": 0.87, "learning_rate": 0.0016975856091249403, "loss": 0.0926, "step": 34560 }, { "epoch": 0.87, "learning_rate": 0.0016972087531090623, "loss": 0.0942, "step": 34570 }, { "epoch": 0.87, "learning_rate": 0.001696831897093184, "loss": 0.0939, "step": 34580 }, { "epoch": 0.87, "learning_rate": 0.0016964550410773055, "loss": 0.0919, "step": 34590 }, { "epoch": 0.87, "learning_rate": 0.0016960781850614275, "loss": 0.0903, "step": 34600 }, { "epoch": 0.87, "learning_rate": 0.0016957013290455495, "loss": 0.0898, "step": 34610 }, { "epoch": 0.87, "learning_rate": 0.0016953244730296712, "loss": 0.0906, "step": 34620 }, { "epoch": 0.87, "learning_rate": 0.001694947617013793, "loss": 0.0888, "step": 34630 }, { "epoch": 0.87, "learning_rate": 0.0016945707609979147, "loss": 0.094, "step": 34640 }, { "epoch": 0.87, "learning_rate": 0.0016941939049820367, "loss": 0.0922, "step": 34650 }, { "epoch": 0.87, "learning_rate": 0.0016938170489661584, "loss": 0.0935, "step": 34660 }, { "epoch": 0.87, "learning_rate": 0.0016934401929502802, "loss": 0.0926, "step": 34670 }, { "epoch": 0.87, "learning_rate": 0.001693063336934402, "loss": 0.0905, "step": 34680 }, { "epoch": 0.87, "learning_rate": 0.0016926864809185239, "loss": 0.0906, "step": 34690 }, { "epoch": 0.87, "learning_rate": 0.0016923096249026458, "loss": 0.0912, "step": 34700 }, { "epoch": 0.87, "learning_rate": 0.0016919327688867673, "loss": 0.092, "step": 34710 }, { "epoch": 0.87, "learning_rate": 0.001691555912870889, "loss": 0.0925, "step": 34720 }, { "epoch": 0.87, "learning_rate": 0.001691179056855011, "loss": 0.0932, "step": 34730 }, { "epoch": 0.87, "learning_rate": 0.0016908022008391326, "loss": 0.0904, "step": 34740 }, { "epoch": 0.87, "learning_rate": 0.0016904253448232545, "loss": 0.0923, "step": 34750 }, { "epoch": 0.87, "learning_rate": 0.0016900484888073763, "loss": 0.0913, "step": 34760 }, { "epoch": 0.87, "learning_rate": 0.0016896716327914982, "loss": 0.0921, "step": 34770 }, { "epoch": 0.87, "learning_rate": 0.0016892947767756198, "loss": 0.0904, "step": 34780 }, { "epoch": 0.87, "learning_rate": 0.0016889179207597417, "loss": 0.0906, "step": 34790 }, { "epoch": 0.87, "learning_rate": 0.0016885410647438637, "loss": 0.0885, "step": 34800 }, { "epoch": 0.87, "learning_rate": 0.0016881642087279854, "loss": 0.0935, "step": 34810 }, { "epoch": 0.87, "learning_rate": 0.001687787352712107, "loss": 0.0912, "step": 34820 }, { "epoch": 0.88, "learning_rate": 0.001687410496696229, "loss": 0.0919, "step": 34830 }, { "epoch": 0.88, "learning_rate": 0.001687033640680351, "loss": 0.0929, "step": 34840 }, { "epoch": 0.88, "learning_rate": 0.0016866567846644726, "loss": 0.0913, "step": 34850 }, { "epoch": 0.88, "learning_rate": 0.0016862799286485942, "loss": 0.0885, "step": 34860 }, { "epoch": 0.88, "learning_rate": 0.0016859030726327161, "loss": 0.0882, "step": 34870 }, { "epoch": 0.88, "learning_rate": 0.001685526216616838, "loss": 0.0944, "step": 34880 }, { "epoch": 0.88, "learning_rate": 0.0016851493606009598, "loss": 0.0919, "step": 34890 }, { "epoch": 0.88, "learning_rate": 0.0016847725045850814, "loss": 0.0915, "step": 34900 }, { "epoch": 0.88, "learning_rate": 0.0016843956485692033, "loss": 0.094, "step": 34910 }, { "epoch": 0.88, "learning_rate": 0.0016840187925533253, "loss": 0.0897, "step": 34920 }, { "epoch": 0.88, "learning_rate": 0.001683641936537447, "loss": 0.0963, "step": 34930 }, { "epoch": 0.88, "learning_rate": 0.0016832650805215688, "loss": 0.0902, "step": 34940 }, { "epoch": 0.88, "learning_rate": 0.0016828882245056905, "loss": 0.0966, "step": 34950 }, { "epoch": 0.88, "learning_rate": 0.0016825113684898125, "loss": 0.0971, "step": 34960 }, { "epoch": 0.88, "learning_rate": 0.001682134512473934, "loss": 0.0928, "step": 34970 }, { "epoch": 0.88, "learning_rate": 0.001681757656458056, "loss": 0.0926, "step": 34980 }, { "epoch": 0.88, "learning_rate": 0.0016813808004421777, "loss": 0.0901, "step": 34990 }, { "epoch": 0.88, "learning_rate": 0.0016810039444262997, "loss": 0.0898, "step": 35000 }, { "epoch": 0.88, "eval_cer": 0.6658870735276637, "eval_loss": 0.07192695885896683, "eval_runtime": 90.571, "eval_samples_per_second": 110.4, "eval_steps_per_second": 6.901, "step": 35000 }, { "epoch": 0.88, "learning_rate": 0.0016806270884104212, "loss": 0.0918, "step": 35010 }, { "epoch": 0.88, "learning_rate": 0.0016802502323945432, "loss": 0.0892, "step": 35020 }, { "epoch": 0.88, "learning_rate": 0.001679873376378665, "loss": 0.0907, "step": 35030 }, { "epoch": 0.88, "learning_rate": 0.0016794965203627869, "loss": 0.0915, "step": 35040 }, { "epoch": 0.88, "learning_rate": 0.0016791196643469084, "loss": 0.0957, "step": 35050 }, { "epoch": 0.88, "learning_rate": 0.0016787428083310304, "loss": 0.0924, "step": 35060 }, { "epoch": 0.88, "learning_rate": 0.001678365952315152, "loss": 0.0896, "step": 35070 }, { "epoch": 0.88, "learning_rate": 0.001677989096299274, "loss": 0.0887, "step": 35080 }, { "epoch": 0.88, "learning_rate": 0.0016776122402833956, "loss": 0.0921, "step": 35090 }, { "epoch": 0.88, "learning_rate": 0.0016772353842675176, "loss": 0.0917, "step": 35100 }, { "epoch": 0.88, "learning_rate": 0.0016768585282516395, "loss": 0.0942, "step": 35110 }, { "epoch": 0.88, "learning_rate": 0.0016764816722357613, "loss": 0.0933, "step": 35120 }, { "epoch": 0.88, "learning_rate": 0.0016761048162198828, "loss": 0.0892, "step": 35130 }, { "epoch": 0.88, "learning_rate": 0.0016757279602040048, "loss": 0.0919, "step": 35140 }, { "epoch": 0.88, "learning_rate": 0.0016753511041881267, "loss": 0.0971, "step": 35150 }, { "epoch": 0.88, "learning_rate": 0.0016749742481722482, "loss": 0.0943, "step": 35160 }, { "epoch": 0.88, "learning_rate": 0.00167459739215637, "loss": 0.0885, "step": 35170 }, { "epoch": 0.88, "learning_rate": 0.001674220536140492, "loss": 0.0894, "step": 35180 }, { "epoch": 0.88, "learning_rate": 0.001673843680124614, "loss": 0.0895, "step": 35190 }, { "epoch": 0.88, "learning_rate": 0.0016734668241087354, "loss": 0.0913, "step": 35200 }, { "epoch": 0.88, "learning_rate": 0.0016730899680928574, "loss": 0.0927, "step": 35210 }, { "epoch": 0.88, "learning_rate": 0.0016727131120769791, "loss": 0.0922, "step": 35220 }, { "epoch": 0.89, "learning_rate": 0.001672336256061101, "loss": 0.0918, "step": 35230 }, { "epoch": 0.89, "learning_rate": 0.0016719594000452226, "loss": 0.0933, "step": 35240 }, { "epoch": 0.89, "learning_rate": 0.0016715825440293446, "loss": 0.0957, "step": 35250 }, { "epoch": 0.89, "learning_rate": 0.0016712056880134663, "loss": 0.0941, "step": 35260 }, { "epoch": 0.89, "learning_rate": 0.0016708288319975883, "loss": 0.0917, "step": 35270 }, { "epoch": 0.89, "learning_rate": 0.0016704519759817098, "loss": 0.0904, "step": 35280 }, { "epoch": 0.89, "learning_rate": 0.0016700751199658318, "loss": 0.09, "step": 35290 }, { "epoch": 0.89, "learning_rate": 0.0016696982639499535, "loss": 0.0926, "step": 35300 }, { "epoch": 0.89, "learning_rate": 0.0016693214079340755, "loss": 0.0889, "step": 35310 }, { "epoch": 0.89, "learning_rate": 0.001668944551918197, "loss": 0.0899, "step": 35320 }, { "epoch": 0.89, "learning_rate": 0.001668567695902319, "loss": 0.0892, "step": 35330 }, { "epoch": 0.89, "learning_rate": 0.0016681908398864407, "loss": 0.0924, "step": 35340 }, { "epoch": 0.89, "learning_rate": 0.0016678139838705627, "loss": 0.0907, "step": 35350 }, { "epoch": 0.89, "learning_rate": 0.0016674371278546842, "loss": 0.0906, "step": 35360 }, { "epoch": 0.89, "learning_rate": 0.0016670602718388062, "loss": 0.0928, "step": 35370 }, { "epoch": 0.89, "learning_rate": 0.0016666834158229281, "loss": 0.0898, "step": 35380 }, { "epoch": 0.89, "learning_rate": 0.0016663065598070497, "loss": 0.0908, "step": 35390 }, { "epoch": 0.89, "learning_rate": 0.0016659297037911714, "loss": 0.0911, "step": 35400 }, { "epoch": 0.89, "learning_rate": 0.0016655528477752934, "loss": 0.0916, "step": 35410 }, { "epoch": 0.89, "learning_rate": 0.0016651759917594153, "loss": 0.0887, "step": 35420 }, { "epoch": 0.89, "learning_rate": 0.0016647991357435369, "loss": 0.091, "step": 35430 }, { "epoch": 0.89, "learning_rate": 0.0016644222797276586, "loss": 0.0907, "step": 35440 }, { "epoch": 0.89, "learning_rate": 0.0016640454237117806, "loss": 0.0908, "step": 35450 }, { "epoch": 0.89, "learning_rate": 0.0016636685676959025, "loss": 0.0903, "step": 35460 }, { "epoch": 0.89, "learning_rate": 0.001663291711680024, "loss": 0.089, "step": 35470 }, { "epoch": 0.89, "learning_rate": 0.0016629148556641458, "loss": 0.0887, "step": 35480 }, { "epoch": 0.89, "learning_rate": 0.0016625379996482678, "loss": 0.0898, "step": 35490 }, { "epoch": 0.89, "learning_rate": 0.0016621611436323897, "loss": 0.0913, "step": 35500 }, { "epoch": 0.89, "eval_cer": 0.6657017998495673, "eval_loss": 0.07208002358675003, "eval_runtime": 90.5347, "eval_samples_per_second": 110.444, "eval_steps_per_second": 6.903, "step": 35500 }, { "epoch": 0.89, "learning_rate": 0.0016617842876165113, "loss": 0.0886, "step": 35510 }, { "epoch": 0.89, "learning_rate": 0.0016614074316006332, "loss": 0.0912, "step": 35520 }, { "epoch": 0.89, "learning_rate": 0.001661030575584755, "loss": 0.0922, "step": 35530 }, { "epoch": 0.89, "learning_rate": 0.001660653719568877, "loss": 0.0907, "step": 35540 }, { "epoch": 0.89, "learning_rate": 0.0016602768635529984, "loss": 0.0882, "step": 35550 }, { "epoch": 0.89, "learning_rate": 0.0016599000075371204, "loss": 0.0863, "step": 35560 }, { "epoch": 0.89, "learning_rate": 0.0016595231515212422, "loss": 0.0889, "step": 35570 }, { "epoch": 0.89, "learning_rate": 0.0016591462955053641, "loss": 0.0906, "step": 35580 }, { "epoch": 0.89, "learning_rate": 0.0016587694394894856, "loss": 0.0917, "step": 35590 }, { "epoch": 0.89, "learning_rate": 0.0016583925834736076, "loss": 0.0931, "step": 35600 }, { "epoch": 0.89, "learning_rate": 0.0016580157274577294, "loss": 0.0898, "step": 35610 }, { "epoch": 0.89, "learning_rate": 0.001657638871441851, "loss": 0.0894, "step": 35620 }, { "epoch": 0.9, "learning_rate": 0.0016572620154259728, "loss": 0.0849, "step": 35630 }, { "epoch": 0.9, "learning_rate": 0.0016568851594100948, "loss": 0.0883, "step": 35640 }, { "epoch": 0.9, "learning_rate": 0.0016565083033942165, "loss": 0.0911, "step": 35650 }, { "epoch": 0.9, "learning_rate": 0.0016561314473783383, "loss": 0.0902, "step": 35660 }, { "epoch": 0.9, "learning_rate": 0.00165575459136246, "loss": 0.0947, "step": 35670 }, { "epoch": 0.9, "learning_rate": 0.001655377735346582, "loss": 0.0884, "step": 35680 }, { "epoch": 0.9, "learning_rate": 0.001655000879330704, "loss": 0.0922, "step": 35690 }, { "epoch": 0.9, "learning_rate": 0.0016546240233148255, "loss": 0.0874, "step": 35700 }, { "epoch": 0.9, "learning_rate": 0.0016542471672989472, "loss": 0.0905, "step": 35710 }, { "epoch": 0.9, "learning_rate": 0.0016538703112830692, "loss": 0.0903, "step": 35720 }, { "epoch": 0.9, "learning_rate": 0.0016534934552671912, "loss": 0.0913, "step": 35730 }, { "epoch": 0.9, "learning_rate": 0.0016531165992513127, "loss": 0.0874, "step": 35740 }, { "epoch": 0.9, "learning_rate": 0.0016527397432354344, "loss": 0.0951, "step": 35750 }, { "epoch": 0.9, "learning_rate": 0.0016523628872195564, "loss": 0.0942, "step": 35760 }, { "epoch": 0.9, "learning_rate": 0.0016519860312036783, "loss": 0.0907, "step": 35770 }, { "epoch": 0.9, "learning_rate": 0.0016516091751877999, "loss": 0.0912, "step": 35780 }, { "epoch": 0.9, "learning_rate": 0.0016512323191719218, "loss": 0.0907, "step": 35790 }, { "epoch": 0.9, "learning_rate": 0.0016508554631560436, "loss": 0.0879, "step": 35800 }, { "epoch": 0.9, "learning_rate": 0.0016504786071401655, "loss": 0.0927, "step": 35810 }, { "epoch": 0.9, "learning_rate": 0.001650101751124287, "loss": 0.0902, "step": 35820 }, { "epoch": 0.9, "learning_rate": 0.001649724895108409, "loss": 0.0913, "step": 35830 }, { "epoch": 0.9, "learning_rate": 0.0016493480390925308, "loss": 0.0917, "step": 35840 }, { "epoch": 0.9, "learning_rate": 0.0016489711830766523, "loss": 0.0927, "step": 35850 }, { "epoch": 0.9, "learning_rate": 0.0016485943270607743, "loss": 0.0917, "step": 35860 }, { "epoch": 0.9, "learning_rate": 0.0016482174710448962, "loss": 0.0922, "step": 35870 }, { "epoch": 0.9, "learning_rate": 0.001647840615029018, "loss": 0.0907, "step": 35880 }, { "epoch": 0.9, "learning_rate": 0.0016474637590131395, "loss": 0.0894, "step": 35890 }, { "epoch": 0.9, "learning_rate": 0.0016470869029972615, "loss": 0.0886, "step": 35900 }, { "epoch": 0.9, "learning_rate": 0.0016467100469813834, "loss": 0.0892, "step": 35910 }, { "epoch": 0.9, "learning_rate": 0.0016463331909655052, "loss": 0.0902, "step": 35920 }, { "epoch": 0.9, "learning_rate": 0.001645956334949627, "loss": 0.0916, "step": 35930 }, { "epoch": 0.9, "learning_rate": 0.0016455794789337487, "loss": 0.0907, "step": 35940 }, { "epoch": 0.9, "learning_rate": 0.0016452026229178706, "loss": 0.0938, "step": 35950 }, { "epoch": 0.9, "learning_rate": 0.0016448257669019926, "loss": 0.0909, "step": 35960 }, { "epoch": 0.9, "learning_rate": 0.0016444489108861141, "loss": 0.0877, "step": 35970 }, { "epoch": 0.9, "learning_rate": 0.0016440720548702359, "loss": 0.0888, "step": 35980 }, { "epoch": 0.9, "learning_rate": 0.0016436951988543578, "loss": 0.0899, "step": 35990 }, { "epoch": 0.9, "learning_rate": 0.0016433183428384798, "loss": 0.0897, "step": 36000 }, { "epoch": 0.9, "eval_cer": 0.6657489604221738, "eval_loss": 0.07150072604417801, "eval_runtime": 90.8705, "eval_samples_per_second": 110.036, "eval_steps_per_second": 6.878, "step": 36000 }, { "epoch": 0.9, "learning_rate": 0.0016429414868226013, "loss": 0.0934, "step": 36010 }, { "epoch": 0.9, "learning_rate": 0.001642564630806723, "loss": 0.0884, "step": 36020 }, { "epoch": 0.91, "learning_rate": 0.001642187774790845, "loss": 0.0897, "step": 36030 }, { "epoch": 0.91, "learning_rate": 0.001641810918774967, "loss": 0.0865, "step": 36040 }, { "epoch": 0.91, "learning_rate": 0.0016414340627590885, "loss": 0.0889, "step": 36050 }, { "epoch": 0.91, "learning_rate": 0.0016410572067432102, "loss": 0.0876, "step": 36060 }, { "epoch": 0.91, "learning_rate": 0.0016406803507273322, "loss": 0.0912, "step": 36070 }, { "epoch": 0.91, "learning_rate": 0.0016403034947114537, "loss": 0.0868, "step": 36080 }, { "epoch": 0.91, "learning_rate": 0.0016399266386955757, "loss": 0.0901, "step": 36090 }, { "epoch": 0.91, "learning_rate": 0.0016395497826796977, "loss": 0.0909, "step": 36100 }, { "epoch": 0.91, "learning_rate": 0.0016391729266638194, "loss": 0.0894, "step": 36110 }, { "epoch": 0.91, "learning_rate": 0.001638796070647941, "loss": 0.0941, "step": 36120 }, { "epoch": 0.91, "learning_rate": 0.0016384192146320629, "loss": 0.0872, "step": 36130 }, { "epoch": 0.91, "learning_rate": 0.0016380423586161849, "loss": 0.0949, "step": 36140 }, { "epoch": 0.91, "learning_rate": 0.0016376655026003066, "loss": 0.0929, "step": 36150 }, { "epoch": 0.91, "learning_rate": 0.0016372886465844281, "loss": 0.0884, "step": 36160 }, { "epoch": 0.91, "learning_rate": 0.00163691179056855, "loss": 0.0931, "step": 36170 }, { "epoch": 0.91, "learning_rate": 0.001636534934552672, "loss": 0.0909, "step": 36180 }, { "epoch": 0.91, "learning_rate": 0.0016361580785367938, "loss": 0.0944, "step": 36190 }, { "epoch": 0.91, "learning_rate": 0.0016357812225209155, "loss": 0.0893, "step": 36200 }, { "epoch": 0.91, "learning_rate": 0.0016354043665050373, "loss": 0.0883, "step": 36210 }, { "epoch": 0.91, "learning_rate": 0.0016350275104891592, "loss": 0.0904, "step": 36220 }, { "epoch": 0.91, "learning_rate": 0.0016346506544732812, "loss": 0.0939, "step": 36230 }, { "epoch": 0.91, "learning_rate": 0.0016342737984574027, "loss": 0.0903, "step": 36240 }, { "epoch": 0.91, "learning_rate": 0.0016338969424415245, "loss": 0.0889, "step": 36250 }, { "epoch": 0.91, "learning_rate": 0.0016335200864256464, "loss": 0.0876, "step": 36260 }, { "epoch": 0.91, "learning_rate": 0.001633143230409768, "loss": 0.0943, "step": 36270 }, { "epoch": 0.91, "learning_rate": 0.00163276637439389, "loss": 0.0916, "step": 36280 }, { "epoch": 0.91, "learning_rate": 0.0016323895183780117, "loss": 0.0893, "step": 36290 }, { "epoch": 0.91, "learning_rate": 0.0016320126623621336, "loss": 0.0915, "step": 36300 }, { "epoch": 0.91, "learning_rate": 0.0016316358063462552, "loss": 0.0883, "step": 36310 }, { "epoch": 0.91, "learning_rate": 0.0016312589503303771, "loss": 0.0879, "step": 36320 }, { "epoch": 0.91, "learning_rate": 0.0016308820943144989, "loss": 0.0872, "step": 36330 }, { "epoch": 0.91, "learning_rate": 0.0016305052382986208, "loss": 0.0907, "step": 36340 }, { "epoch": 0.91, "learning_rate": 0.0016301283822827424, "loss": 0.0913, "step": 36350 }, { "epoch": 0.91, "learning_rate": 0.0016297515262668643, "loss": 0.0866, "step": 36360 }, { "epoch": 0.91, "learning_rate": 0.0016293746702509863, "loss": 0.0929, "step": 36370 }, { "epoch": 0.91, "learning_rate": 0.001628997814235108, "loss": 0.091, "step": 36380 }, { "epoch": 0.91, "learning_rate": 0.0016286209582192296, "loss": 0.0866, "step": 36390 }, { "epoch": 0.91, "learning_rate": 0.0016282441022033515, "loss": 0.0895, "step": 36400 }, { "epoch": 0.91, "learning_rate": 0.0016278672461874735, "loss": 0.088, "step": 36410 }, { "epoch": 0.91, "learning_rate": 0.0016274903901715952, "loss": 0.0907, "step": 36420 }, { "epoch": 0.92, "learning_rate": 0.0016271135341557167, "loss": 0.0956, "step": 36430 }, { "epoch": 0.92, "learning_rate": 0.0016267366781398387, "loss": 0.0899, "step": 36440 }, { "epoch": 0.92, "learning_rate": 0.0016263598221239607, "loss": 0.0883, "step": 36450 }, { "epoch": 0.92, "learning_rate": 0.0016259829661080824, "loss": 0.09, "step": 36460 }, { "epoch": 0.92, "learning_rate": 0.001625606110092204, "loss": 0.0912, "step": 36470 }, { "epoch": 0.92, "learning_rate": 0.001625229254076326, "loss": 0.0923, "step": 36480 }, { "epoch": 0.92, "learning_rate": 0.0016248523980604479, "loss": 0.0876, "step": 36490 }, { "epoch": 0.92, "learning_rate": 0.0016244755420445694, "loss": 0.0887, "step": 36500 }, { "epoch": 0.92, "eval_cer": 0.6658702304660187, "eval_loss": 0.07075611501932144, "eval_runtime": 90.7034, "eval_samples_per_second": 110.238, "eval_steps_per_second": 6.891, "step": 36500 }, { "epoch": 0.92, "learning_rate": 0.0016240986860286914, "loss": 0.089, "step": 36510 }, { "epoch": 0.92, "learning_rate": 0.001623721830012813, "loss": 0.0892, "step": 36520 }, { "epoch": 0.92, "learning_rate": 0.001623344973996935, "loss": 0.094, "step": 36530 }, { "epoch": 0.92, "learning_rate": 0.0016229681179810566, "loss": 0.0915, "step": 36540 }, { "epoch": 0.92, "learning_rate": 0.0016225912619651785, "loss": 0.0863, "step": 36550 }, { "epoch": 0.92, "learning_rate": 0.0016222144059493003, "loss": 0.0909, "step": 36560 }, { "epoch": 0.92, "learning_rate": 0.0016218375499334223, "loss": 0.0877, "step": 36570 }, { "epoch": 0.92, "learning_rate": 0.0016214606939175438, "loss": 0.0923, "step": 36580 }, { "epoch": 0.92, "learning_rate": 0.0016210838379016657, "loss": 0.0893, "step": 36590 }, { "epoch": 0.92, "learning_rate": 0.0016207069818857875, "loss": 0.0924, "step": 36600 }, { "epoch": 0.92, "learning_rate": 0.0016203301258699095, "loss": 0.0908, "step": 36610 }, { "epoch": 0.92, "learning_rate": 0.001619953269854031, "loss": 0.0874, "step": 36620 }, { "epoch": 0.92, "learning_rate": 0.001619576413838153, "loss": 0.0859, "step": 36630 }, { "epoch": 0.92, "learning_rate": 0.0016191995578222747, "loss": 0.0923, "step": 36640 }, { "epoch": 0.92, "learning_rate": 0.0016188227018063966, "loss": 0.091, "step": 36650 }, { "epoch": 0.92, "learning_rate": 0.0016184458457905182, "loss": 0.0898, "step": 36660 }, { "epoch": 0.92, "learning_rate": 0.0016180689897746401, "loss": 0.0874, "step": 36670 }, { "epoch": 0.92, "learning_rate": 0.001617692133758762, "loss": 0.0881, "step": 36680 }, { "epoch": 0.92, "learning_rate": 0.0016173152777428838, "loss": 0.0915, "step": 36690 }, { "epoch": 0.92, "learning_rate": 0.0016169384217270054, "loss": 0.0905, "step": 36700 }, { "epoch": 0.92, "learning_rate": 0.0016165615657111273, "loss": 0.091, "step": 36710 }, { "epoch": 0.92, "learning_rate": 0.0016161847096952493, "loss": 0.09, "step": 36720 }, { "epoch": 0.92, "learning_rate": 0.0016158078536793708, "loss": 0.0872, "step": 36730 }, { "epoch": 0.92, "learning_rate": 0.0016154309976634926, "loss": 0.0867, "step": 36740 }, { "epoch": 0.92, "learning_rate": 0.0016150541416476145, "loss": 0.0875, "step": 36750 }, { "epoch": 0.92, "learning_rate": 0.0016146772856317365, "loss": 0.0902, "step": 36760 }, { "epoch": 0.92, "learning_rate": 0.001614300429615858, "loss": 0.0915, "step": 36770 }, { "epoch": 0.92, "learning_rate": 0.00161392357359998, "loss": 0.089, "step": 36780 }, { "epoch": 0.92, "learning_rate": 0.0016135467175841017, "loss": 0.0867, "step": 36790 }, { "epoch": 0.92, "learning_rate": 0.0016131698615682237, "loss": 0.0884, "step": 36800 }, { "epoch": 0.92, "learning_rate": 0.0016127930055523452, "loss": 0.0907, "step": 36810 }, { "epoch": 0.93, "learning_rate": 0.0016124161495364672, "loss": 0.0911, "step": 36820 }, { "epoch": 0.93, "learning_rate": 0.001612039293520589, "loss": 0.0903, "step": 36830 }, { "epoch": 0.93, "learning_rate": 0.0016116624375047109, "loss": 0.0893, "step": 36840 }, { "epoch": 0.93, "learning_rate": 0.0016112855814888324, "loss": 0.0912, "step": 36850 }, { "epoch": 0.93, "learning_rate": 0.0016109087254729544, "loss": 0.0902, "step": 36860 }, { "epoch": 0.93, "learning_rate": 0.0016105318694570761, "loss": 0.0936, "step": 36870 }, { "epoch": 0.93, "learning_rate": 0.001610155013441198, "loss": 0.0901, "step": 36880 }, { "epoch": 0.93, "learning_rate": 0.0016097781574253196, "loss": 0.0864, "step": 36890 }, { "epoch": 0.93, "learning_rate": 0.0016094013014094416, "loss": 0.0862, "step": 36900 }, { "epoch": 0.93, "learning_rate": 0.0016090244453935633, "loss": 0.089, "step": 36910 }, { "epoch": 0.93, "learning_rate": 0.0016086475893776853, "loss": 0.089, "step": 36920 }, { "epoch": 0.93, "learning_rate": 0.0016082707333618068, "loss": 0.088, "step": 36930 }, { "epoch": 0.93, "learning_rate": 0.0016078938773459288, "loss": 0.0889, "step": 36940 }, { "epoch": 0.93, "learning_rate": 0.0016075170213300507, "loss": 0.0884, "step": 36950 }, { "epoch": 0.93, "learning_rate": 0.0016071401653141722, "loss": 0.0884, "step": 36960 }, { "epoch": 0.93, "learning_rate": 0.001606763309298294, "loss": 0.086, "step": 36970 }, { "epoch": 0.93, "learning_rate": 0.001606386453282416, "loss": 0.091, "step": 36980 }, { "epoch": 0.93, "learning_rate": 0.001606009597266538, "loss": 0.0906, "step": 36990 }, { "epoch": 0.93, "learning_rate": 0.0016056327412506594, "loss": 0.0922, "step": 37000 }, { "epoch": 0.93, "eval_cer": 0.6653331774147055, "eval_loss": 0.07120376080274582, "eval_runtime": 90.8589, "eval_samples_per_second": 110.05, "eval_steps_per_second": 6.879, "step": 37000 }, { "epoch": 0.93, "learning_rate": 0.0016052558852347812, "loss": 0.0909, "step": 37010 }, { "epoch": 0.93, "learning_rate": 0.0016048790292189031, "loss": 0.0879, "step": 37020 }, { "epoch": 0.93, "learning_rate": 0.0016045021732030251, "loss": 0.0878, "step": 37030 }, { "epoch": 0.93, "learning_rate": 0.0016041253171871466, "loss": 0.0872, "step": 37040 }, { "epoch": 0.93, "learning_rate": 0.0016037484611712684, "loss": 0.0867, "step": 37050 }, { "epoch": 0.93, "learning_rate": 0.0016033716051553903, "loss": 0.0886, "step": 37060 }, { "epoch": 0.93, "learning_rate": 0.0016029947491395123, "loss": 0.0873, "step": 37070 }, { "epoch": 0.93, "learning_rate": 0.0016026178931236338, "loss": 0.0892, "step": 37080 }, { "epoch": 0.93, "learning_rate": 0.0016022410371077558, "loss": 0.0889, "step": 37090 }, { "epoch": 0.93, "learning_rate": 0.0016018641810918775, "loss": 0.0872, "step": 37100 }, { "epoch": 0.93, "learning_rate": 0.0016014873250759995, "loss": 0.0892, "step": 37110 }, { "epoch": 0.93, "learning_rate": 0.001601110469060121, "loss": 0.0914, "step": 37120 }, { "epoch": 0.93, "learning_rate": 0.001600733613044243, "loss": 0.09, "step": 37130 }, { "epoch": 0.93, "learning_rate": 0.0016003567570283647, "loss": 0.0882, "step": 37140 }, { "epoch": 0.93, "learning_rate": 0.0015999799010124867, "loss": 0.0852, "step": 37150 }, { "epoch": 0.93, "learning_rate": 0.0015996030449966082, "loss": 0.0871, "step": 37160 }, { "epoch": 0.93, "learning_rate": 0.0015992261889807302, "loss": 0.0884, "step": 37170 }, { "epoch": 0.93, "learning_rate": 0.001598849332964852, "loss": 0.092, "step": 37180 }, { "epoch": 0.93, "learning_rate": 0.0015984724769489737, "loss": 0.0903, "step": 37190 }, { "epoch": 0.93, "learning_rate": 0.0015980956209330954, "loss": 0.0893, "step": 37200 }, { "epoch": 0.93, "learning_rate": 0.0015977187649172174, "loss": 0.0898, "step": 37210 }, { "epoch": 0.94, "learning_rate": 0.0015973419089013393, "loss": 0.0907, "step": 37220 }, { "epoch": 0.94, "learning_rate": 0.0015969650528854609, "loss": 0.0897, "step": 37230 }, { "epoch": 0.94, "learning_rate": 0.0015965881968695826, "loss": 0.0923, "step": 37240 }, { "epoch": 0.94, "learning_rate": 0.0015962113408537046, "loss": 0.0909, "step": 37250 }, { "epoch": 0.94, "learning_rate": 0.0015958344848378265, "loss": 0.0909, "step": 37260 }, { "epoch": 0.94, "learning_rate": 0.001595457628821948, "loss": 0.0874, "step": 37270 }, { "epoch": 0.94, "learning_rate": 0.0015950807728060698, "loss": 0.0862, "step": 37280 }, { "epoch": 0.94, "learning_rate": 0.0015947039167901918, "loss": 0.089, "step": 37290 }, { "epoch": 0.94, "learning_rate": 0.0015943270607743137, "loss": 0.0852, "step": 37300 }, { "epoch": 0.94, "learning_rate": 0.0015939502047584353, "loss": 0.0898, "step": 37310 }, { "epoch": 0.94, "learning_rate": 0.001593573348742557, "loss": 0.0906, "step": 37320 }, { "epoch": 0.94, "learning_rate": 0.001593196492726679, "loss": 0.0905, "step": 37330 }, { "epoch": 0.94, "learning_rate": 0.001592819636710801, "loss": 0.0873, "step": 37340 }, { "epoch": 0.94, "learning_rate": 0.0015924427806949225, "loss": 0.0883, "step": 37350 }, { "epoch": 0.94, "learning_rate": 0.0015920659246790444, "loss": 0.087, "step": 37360 }, { "epoch": 0.94, "learning_rate": 0.0015916890686631662, "loss": 0.0909, "step": 37370 }, { "epoch": 0.94, "learning_rate": 0.0015913122126472877, "loss": 0.0908, "step": 37380 }, { "epoch": 0.94, "learning_rate": 0.0015909353566314097, "loss": 0.0917, "step": 37390 }, { "epoch": 0.94, "learning_rate": 0.0015905585006155316, "loss": 0.0889, "step": 37400 }, { "epoch": 0.94, "learning_rate": 0.0015901816445996534, "loss": 0.0891, "step": 37410 }, { "epoch": 0.94, "learning_rate": 0.0015898047885837749, "loss": 0.0904, "step": 37420 }, { "epoch": 0.94, "learning_rate": 0.0015894279325678968, "loss": 0.0897, "step": 37430 }, { "epoch": 0.94, "learning_rate": 0.0015890510765520188, "loss": 0.0869, "step": 37440 }, { "epoch": 0.94, "learning_rate": 0.0015886742205361406, "loss": 0.0849, "step": 37450 }, { "epoch": 0.94, "learning_rate": 0.001588297364520262, "loss": 0.0891, "step": 37460 }, { "epoch": 0.94, "learning_rate": 0.001587920508504384, "loss": 0.0919, "step": 37470 }, { "epoch": 0.94, "learning_rate": 0.001587543652488506, "loss": 0.0893, "step": 37480 }, { "epoch": 0.94, "learning_rate": 0.0015871667964726277, "loss": 0.0892, "step": 37490 }, { "epoch": 0.94, "learning_rate": 0.0015867899404567495, "loss": 0.0905, "step": 37500 }, { "epoch": 0.94, "eval_cer": 0.6659635891505659, "eval_loss": 0.07065676897764206, "eval_runtime": 90.5606, "eval_samples_per_second": 110.412, "eval_steps_per_second": 6.901, "step": 37500 }, { "epoch": 0.94, "learning_rate": 0.0015864130844408712, "loss": 0.0874, "step": 37510 }, { "epoch": 0.94, "learning_rate": 0.0015860362284249932, "loss": 0.0857, "step": 37520 }, { "epoch": 0.94, "learning_rate": 0.0015856593724091152, "loss": 0.0874, "step": 37530 }, { "epoch": 0.94, "learning_rate": 0.0015852825163932367, "loss": 0.0898, "step": 37540 }, { "epoch": 0.94, "learning_rate": 0.0015849056603773584, "loss": 0.0887, "step": 37550 }, { "epoch": 0.94, "learning_rate": 0.0015845288043614804, "loss": 0.0885, "step": 37560 }, { "epoch": 0.94, "learning_rate": 0.0015841519483456024, "loss": 0.0867, "step": 37570 }, { "epoch": 0.94, "learning_rate": 0.0015837750923297239, "loss": 0.089, "step": 37580 }, { "epoch": 0.94, "learning_rate": 0.0015833982363138456, "loss": 0.0883, "step": 37590 }, { "epoch": 0.94, "learning_rate": 0.0015830213802979676, "loss": 0.0857, "step": 37600 }, { "epoch": 0.94, "learning_rate": 0.0015826445242820891, "loss": 0.0898, "step": 37610 }, { "epoch": 0.95, "learning_rate": 0.001582267668266211, "loss": 0.0881, "step": 37620 }, { "epoch": 0.95, "learning_rate": 0.001581890812250333, "loss": 0.0901, "step": 37630 }, { "epoch": 0.95, "learning_rate": 0.0015815139562344548, "loss": 0.0857, "step": 37640 }, { "epoch": 0.95, "learning_rate": 0.0015811371002185763, "loss": 0.0888, "step": 37650 }, { "epoch": 0.95, "learning_rate": 0.0015807602442026983, "loss": 0.093, "step": 37660 }, { "epoch": 0.95, "learning_rate": 0.0015803833881868202, "loss": 0.0835, "step": 37670 }, { "epoch": 0.95, "learning_rate": 0.001580006532170942, "loss": 0.0839, "step": 37680 }, { "epoch": 0.95, "learning_rate": 0.0015796296761550635, "loss": 0.0881, "step": 37690 }, { "epoch": 0.95, "learning_rate": 0.0015792528201391855, "loss": 0.0925, "step": 37700 }, { "epoch": 0.95, "learning_rate": 0.0015788759641233074, "loss": 0.0915, "step": 37710 }, { "epoch": 0.95, "learning_rate": 0.0015784991081074292, "loss": 0.0862, "step": 37720 }, { "epoch": 0.95, "learning_rate": 0.0015781222520915507, "loss": 0.0904, "step": 37730 }, { "epoch": 0.95, "learning_rate": 0.0015777453960756727, "loss": 0.0922, "step": 37740 }, { "epoch": 0.95, "learning_rate": 0.0015773685400597946, "loss": 0.0893, "step": 37750 }, { "epoch": 0.95, "learning_rate": 0.0015769916840439164, "loss": 0.0925, "step": 37760 }, { "epoch": 0.95, "learning_rate": 0.0015766148280280381, "loss": 0.0914, "step": 37770 }, { "epoch": 0.95, "learning_rate": 0.0015762379720121599, "loss": 0.0861, "step": 37780 }, { "epoch": 0.95, "learning_rate": 0.0015758611159962818, "loss": 0.09, "step": 37790 }, { "epoch": 0.95, "learning_rate": 0.0015754842599804038, "loss": 0.0869, "step": 37800 }, { "epoch": 0.95, "learning_rate": 0.0015751074039645253, "loss": 0.0865, "step": 37810 }, { "epoch": 0.95, "learning_rate": 0.001574730547948647, "loss": 0.0893, "step": 37820 }, { "epoch": 0.95, "learning_rate": 0.001574353691932769, "loss": 0.0851, "step": 37830 }, { "epoch": 0.95, "learning_rate": 0.0015739768359168905, "loss": 0.0882, "step": 37840 }, { "epoch": 0.95, "learning_rate": 0.0015735999799010125, "loss": 0.0886, "step": 37850 }, { "epoch": 0.95, "learning_rate": 0.0015732231238851343, "loss": 0.0908, "step": 37860 }, { "epoch": 0.95, "learning_rate": 0.0015728462678692562, "loss": 0.0871, "step": 37870 }, { "epoch": 0.95, "learning_rate": 0.0015724694118533777, "loss": 0.0869, "step": 37880 }, { "epoch": 0.95, "learning_rate": 0.0015720925558374997, "loss": 0.0918, "step": 37890 }, { "epoch": 0.95, "learning_rate": 0.0015717156998216214, "loss": 0.0886, "step": 37900 }, { "epoch": 0.95, "learning_rate": 0.0015713388438057434, "loss": 0.0904, "step": 37910 }, { "epoch": 0.95, "learning_rate": 0.001570961987789865, "loss": 0.0907, "step": 37920 }, { "epoch": 0.95, "learning_rate": 0.001570585131773987, "loss": 0.0886, "step": 37930 }, { "epoch": 0.95, "learning_rate": 0.0015702082757581089, "loss": 0.0878, "step": 37940 }, { "epoch": 0.95, "learning_rate": 0.0015698314197422306, "loss": 0.0868, "step": 37950 }, { "epoch": 0.95, "learning_rate": 0.0015694545637263521, "loss": 0.0882, "step": 37960 }, { "epoch": 0.95, "learning_rate": 0.001569077707710474, "loss": 0.0859, "step": 37970 }, { "epoch": 0.95, "learning_rate": 0.001568700851694596, "loss": 0.0885, "step": 37980 }, { "epoch": 0.95, "learning_rate": 0.0015683239956787178, "loss": 0.0905, "step": 37990 }, { "epoch": 0.95, "learning_rate": 0.0015679471396628393, "loss": 0.0881, "step": 38000 }, { "epoch": 0.95, "eval_cer": 0.6658206637417488, "eval_loss": 0.07003695517778397, "eval_runtime": 90.6769, "eval_samples_per_second": 110.271, "eval_steps_per_second": 6.893, "step": 38000 }, { "epoch": 0.95, "learning_rate": 0.0015675702836469613, "loss": 0.0887, "step": 38010 }, { "epoch": 0.96, "learning_rate": 0.0015671934276310832, "loss": 0.0889, "step": 38020 }, { "epoch": 0.96, "learning_rate": 0.001566816571615205, "loss": 0.0903, "step": 38030 }, { "epoch": 0.96, "learning_rate": 0.0015664397155993267, "loss": 0.0895, "step": 38040 }, { "epoch": 0.96, "learning_rate": 0.0015660628595834485, "loss": 0.0887, "step": 38050 }, { "epoch": 0.96, "learning_rate": 0.0015656860035675704, "loss": 0.0874, "step": 38060 }, { "epoch": 0.96, "learning_rate": 0.001565309147551692, "loss": 0.0902, "step": 38070 }, { "epoch": 0.96, "learning_rate": 0.001564932291535814, "loss": 0.0883, "step": 38080 }, { "epoch": 0.96, "learning_rate": 0.0015645554355199357, "loss": 0.0902, "step": 38090 }, { "epoch": 0.96, "learning_rate": 0.0015641785795040576, "loss": 0.0919, "step": 38100 }, { "epoch": 0.96, "learning_rate": 0.0015638017234881792, "loss": 0.0886, "step": 38110 }, { "epoch": 0.96, "learning_rate": 0.0015634248674723011, "loss": 0.089, "step": 38120 }, { "epoch": 0.96, "learning_rate": 0.0015630480114564229, "loss": 0.0936, "step": 38130 }, { "epoch": 0.96, "learning_rate": 0.0015626711554405448, "loss": 0.0878, "step": 38140 }, { "epoch": 0.96, "learning_rate": 0.0015622942994246664, "loss": 0.0909, "step": 38150 }, { "epoch": 0.96, "learning_rate": 0.0015619174434087883, "loss": 0.0903, "step": 38160 }, { "epoch": 0.96, "learning_rate": 0.00156154058739291, "loss": 0.084, "step": 38170 }, { "epoch": 0.96, "learning_rate": 0.001561163731377032, "loss": 0.0861, "step": 38180 }, { "epoch": 0.96, "learning_rate": 0.0015607868753611536, "loss": 0.0859, "step": 38190 }, { "epoch": 0.96, "learning_rate": 0.0015604100193452755, "loss": 0.0859, "step": 38200 }, { "epoch": 0.96, "learning_rate": 0.0015600331633293975, "loss": 0.0887, "step": 38210 }, { "epoch": 0.96, "learning_rate": 0.0015596563073135192, "loss": 0.0907, "step": 38220 }, { "epoch": 0.96, "learning_rate": 0.0015592794512976408, "loss": 0.0895, "step": 38230 }, { "epoch": 0.96, "learning_rate": 0.0015589025952817627, "loss": 0.0889, "step": 38240 }, { "epoch": 0.96, "learning_rate": 0.0015585257392658847, "loss": 0.0867, "step": 38250 }, { "epoch": 0.96, "learning_rate": 0.0015581488832500064, "loss": 0.0874, "step": 38260 }, { "epoch": 0.96, "learning_rate": 0.001557772027234128, "loss": 0.0905, "step": 38270 }, { "epoch": 0.96, "learning_rate": 0.00155739517121825, "loss": 0.0847, "step": 38280 }, { "epoch": 0.96, "learning_rate": 0.0015570183152023719, "loss": 0.0872, "step": 38290 }, { "epoch": 0.96, "learning_rate": 0.0015566414591864934, "loss": 0.0881, "step": 38300 }, { "epoch": 0.96, "learning_rate": 0.0015562646031706151, "loss": 0.0879, "step": 38310 }, { "epoch": 0.96, "learning_rate": 0.001555887747154737, "loss": 0.0908, "step": 38320 }, { "epoch": 0.96, "learning_rate": 0.001555510891138859, "loss": 0.0904, "step": 38330 }, { "epoch": 0.96, "learning_rate": 0.0015551340351229806, "loss": 0.0863, "step": 38340 }, { "epoch": 0.96, "learning_rate": 0.0015547571791071026, "loss": 0.0832, "step": 38350 }, { "epoch": 0.96, "learning_rate": 0.0015543803230912243, "loss": 0.0862, "step": 38360 }, { "epoch": 0.96, "learning_rate": 0.0015540034670753463, "loss": 0.0832, "step": 38370 }, { "epoch": 0.96, "learning_rate": 0.0015536266110594678, "loss": 0.0855, "step": 38380 }, { "epoch": 0.96, "learning_rate": 0.0015532497550435898, "loss": 0.0871, "step": 38390 }, { "epoch": 0.96, "learning_rate": 0.0015528728990277115, "loss": 0.0921, "step": 38400 }, { "epoch": 0.96, "learning_rate": 0.0015524960430118335, "loss": 0.0882, "step": 38410 }, { "epoch": 0.97, "learning_rate": 0.001552119186995955, "loss": 0.0872, "step": 38420 }, { "epoch": 0.97, "learning_rate": 0.001551742330980077, "loss": 0.0829, "step": 38430 }, { "epoch": 0.97, "learning_rate": 0.0015513654749641987, "loss": 0.0887, "step": 38440 }, { "epoch": 0.97, "learning_rate": 0.0015509886189483207, "loss": 0.0885, "step": 38450 }, { "epoch": 0.97, "learning_rate": 0.0015506117629324422, "loss": 0.088, "step": 38460 }, { "epoch": 0.97, "learning_rate": 0.0015502349069165641, "loss": 0.0894, "step": 38470 }, { "epoch": 0.97, "learning_rate": 0.0015498580509006859, "loss": 0.0892, "step": 38480 }, { "epoch": 0.97, "learning_rate": 0.0015494811948848078, "loss": 0.0859, "step": 38490 }, { "epoch": 0.97, "learning_rate": 0.0015491043388689294, "loss": 0.0858, "step": 38500 }, { "epoch": 0.97, "eval_cer": 0.6658187388204179, "eval_loss": 0.0693318322300911, "eval_runtime": 90.5702, "eval_samples_per_second": 110.401, "eval_steps_per_second": 6.901, "step": 38500 }, { "epoch": 0.97, "learning_rate": 0.0015487274828530513, "loss": 0.088, "step": 38510 }, { "epoch": 0.97, "learning_rate": 0.0015483506268371733, "loss": 0.0885, "step": 38520 }, { "epoch": 0.97, "learning_rate": 0.0015479737708212948, "loss": 0.0879, "step": 38530 }, { "epoch": 0.97, "learning_rate": 0.0015475969148054166, "loss": 0.0867, "step": 38540 }, { "epoch": 0.97, "learning_rate": 0.0015472200587895385, "loss": 0.0869, "step": 38550 }, { "epoch": 0.97, "learning_rate": 0.0015468432027736605, "loss": 0.0877, "step": 38560 }, { "epoch": 0.97, "learning_rate": 0.001546466346757782, "loss": 0.0886, "step": 38570 }, { "epoch": 0.97, "learning_rate": 0.0015460894907419038, "loss": 0.0855, "step": 38580 }, { "epoch": 0.97, "learning_rate": 0.0015457126347260257, "loss": 0.0903, "step": 38590 }, { "epoch": 0.97, "learning_rate": 0.0015453357787101477, "loss": 0.0868, "step": 38600 }, { "epoch": 0.97, "learning_rate": 0.0015449589226942692, "loss": 0.0871, "step": 38610 }, { "epoch": 0.97, "learning_rate": 0.0015445820666783912, "loss": 0.0901, "step": 38620 }, { "epoch": 0.97, "learning_rate": 0.001544205210662513, "loss": 0.0852, "step": 38630 }, { "epoch": 0.97, "learning_rate": 0.0015438283546466349, "loss": 0.0877, "step": 38640 }, { "epoch": 0.97, "learning_rate": 0.0015434514986307564, "loss": 0.0863, "step": 38650 }, { "epoch": 0.97, "learning_rate": 0.0015430746426148784, "loss": 0.0878, "step": 38660 }, { "epoch": 0.97, "learning_rate": 0.0015426977865990001, "loss": 0.0883, "step": 38670 }, { "epoch": 0.97, "learning_rate": 0.001542320930583122, "loss": 0.0878, "step": 38680 }, { "epoch": 0.97, "learning_rate": 0.0015419440745672436, "loss": 0.0835, "step": 38690 }, { "epoch": 0.97, "learning_rate": 0.0015415672185513656, "loss": 0.09, "step": 38700 }, { "epoch": 0.97, "learning_rate": 0.0015411903625354873, "loss": 0.087, "step": 38710 }, { "epoch": 0.97, "learning_rate": 0.0015408135065196088, "loss": 0.0869, "step": 38720 }, { "epoch": 0.97, "learning_rate": 0.0015404366505037308, "loss": 0.0866, "step": 38730 }, { "epoch": 0.97, "learning_rate": 0.0015400597944878528, "loss": 0.0861, "step": 38740 }, { "epoch": 0.97, "learning_rate": 0.0015396829384719745, "loss": 0.0859, "step": 38750 }, { "epoch": 0.97, "learning_rate": 0.0015393060824560963, "loss": 0.0833, "step": 38760 }, { "epoch": 0.97, "learning_rate": 0.001538929226440218, "loss": 0.0875, "step": 38770 }, { "epoch": 0.97, "learning_rate": 0.00153855237042434, "loss": 0.094, "step": 38780 }, { "epoch": 0.97, "learning_rate": 0.001538175514408462, "loss": 0.0892, "step": 38790 }, { "epoch": 0.97, "learning_rate": 0.0015377986583925835, "loss": 0.0866, "step": 38800 }, { "epoch": 0.98, "learning_rate": 0.0015374218023767052, "loss": 0.0841, "step": 38810 }, { "epoch": 0.98, "learning_rate": 0.0015370449463608272, "loss": 0.086, "step": 38820 }, { "epoch": 0.98, "learning_rate": 0.0015366680903449491, "loss": 0.0915, "step": 38830 }, { "epoch": 0.98, "learning_rate": 0.0015362912343290706, "loss": 0.0834, "step": 38840 }, { "epoch": 0.98, "learning_rate": 0.0015359143783131924, "loss": 0.0863, "step": 38850 }, { "epoch": 0.98, "learning_rate": 0.0015355375222973144, "loss": 0.0908, "step": 38860 }, { "epoch": 0.98, "learning_rate": 0.0015351606662814363, "loss": 0.0893, "step": 38870 }, { "epoch": 0.98, "learning_rate": 0.0015347838102655578, "loss": 0.0884, "step": 38880 }, { "epoch": 0.98, "learning_rate": 0.0015344069542496796, "loss": 0.091, "step": 38890 }, { "epoch": 0.98, "learning_rate": 0.0015340300982338015, "loss": 0.0845, "step": 38900 }, { "epoch": 0.98, "learning_rate": 0.0015336532422179235, "loss": 0.0864, "step": 38910 }, { "epoch": 0.98, "learning_rate": 0.001533276386202045, "loss": 0.0837, "step": 38920 }, { "epoch": 0.98, "learning_rate": 0.001532899530186167, "loss": 0.0895, "step": 38930 }, { "epoch": 0.98, "learning_rate": 0.0015325226741702887, "loss": 0.0854, "step": 38940 }, { "epoch": 0.98, "learning_rate": 0.0015321458181544103, "loss": 0.0863, "step": 38950 }, { "epoch": 0.98, "learning_rate": 0.0015317689621385322, "loss": 0.087, "step": 38960 }, { "epoch": 0.98, "learning_rate": 0.0015313921061226542, "loss": 0.0855, "step": 38970 }, { "epoch": 0.98, "learning_rate": 0.001531015250106776, "loss": 0.087, "step": 38980 }, { "epoch": 0.98, "learning_rate": 0.0015306383940908975, "loss": 0.0867, "step": 38990 }, { "epoch": 0.98, "learning_rate": 0.0015302615380750194, "loss": 0.0882, "step": 39000 }, { "epoch": 0.98, "eval_cer": 0.6656575266589574, "eval_loss": 0.06897370517253876, "eval_runtime": 90.71, "eval_samples_per_second": 110.23, "eval_steps_per_second": 6.89, "step": 39000 }, { "epoch": 0.98, "learning_rate": 0.0015298846820591414, "loss": 0.0879, "step": 39010 }, { "epoch": 0.98, "learning_rate": 0.0015295078260432631, "loss": 0.0867, "step": 39020 }, { "epoch": 0.98, "learning_rate": 0.0015291309700273849, "loss": 0.0872, "step": 39030 }, { "epoch": 0.98, "learning_rate": 0.0015287541140115066, "loss": 0.087, "step": 39040 }, { "epoch": 0.98, "learning_rate": 0.0015283772579956286, "loss": 0.0864, "step": 39050 }, { "epoch": 0.98, "learning_rate": 0.0015280004019797503, "loss": 0.089, "step": 39060 }, { "epoch": 0.98, "learning_rate": 0.001527623545963872, "loss": 0.0869, "step": 39070 }, { "epoch": 0.98, "learning_rate": 0.0015272466899479938, "loss": 0.0884, "step": 39080 }, { "epoch": 0.98, "learning_rate": 0.0015268698339321158, "loss": 0.0859, "step": 39090 }, { "epoch": 0.98, "learning_rate": 0.0015264929779162377, "loss": 0.0887, "step": 39100 }, { "epoch": 0.98, "learning_rate": 0.0015261161219003593, "loss": 0.0884, "step": 39110 }, { "epoch": 0.98, "learning_rate": 0.001525739265884481, "loss": 0.0872, "step": 39120 }, { "epoch": 0.98, "learning_rate": 0.001525362409868603, "loss": 0.0873, "step": 39130 }, { "epoch": 0.98, "learning_rate": 0.001524985553852725, "loss": 0.0838, "step": 39140 }, { "epoch": 0.98, "learning_rate": 0.0015246086978368465, "loss": 0.0855, "step": 39150 }, { "epoch": 0.98, "learning_rate": 0.0015242318418209682, "loss": 0.0864, "step": 39160 }, { "epoch": 0.98, "learning_rate": 0.0015238549858050902, "loss": 0.0874, "step": 39170 }, { "epoch": 0.98, "learning_rate": 0.0015234781297892117, "loss": 0.0882, "step": 39180 }, { "epoch": 0.98, "learning_rate": 0.0015231012737733337, "loss": 0.0869, "step": 39190 }, { "epoch": 0.98, "learning_rate": 0.0015227244177574556, "loss": 0.0886, "step": 39200 }, { "epoch": 0.99, "learning_rate": 0.0015223475617415774, "loss": 0.0848, "step": 39210 }, { "epoch": 0.99, "learning_rate": 0.001521970705725699, "loss": 0.0905, "step": 39220 }, { "epoch": 0.99, "learning_rate": 0.0015215938497098209, "loss": 0.0897, "step": 39230 }, { "epoch": 0.99, "learning_rate": 0.0015212169936939428, "loss": 0.0887, "step": 39240 }, { "epoch": 0.99, "learning_rate": 0.0015208401376780646, "loss": 0.0858, "step": 39250 }, { "epoch": 0.99, "learning_rate": 0.001520463281662186, "loss": 0.0861, "step": 39260 }, { "epoch": 0.99, "learning_rate": 0.001520086425646308, "loss": 0.0894, "step": 39270 }, { "epoch": 0.99, "learning_rate": 0.00151970956963043, "loss": 0.0888, "step": 39280 }, { "epoch": 0.99, "learning_rate": 0.0015193327136145518, "loss": 0.0865, "step": 39290 }, { "epoch": 0.99, "learning_rate": 0.0015189558575986733, "loss": 0.0905, "step": 39300 }, { "epoch": 0.99, "learning_rate": 0.0015185790015827952, "loss": 0.0842, "step": 39310 }, { "epoch": 0.99, "learning_rate": 0.0015182021455669172, "loss": 0.0872, "step": 39320 }, { "epoch": 0.99, "learning_rate": 0.001517825289551039, "loss": 0.09, "step": 39330 }, { "epoch": 0.99, "learning_rate": 0.0015174484335351607, "loss": 0.0873, "step": 39340 }, { "epoch": 0.99, "learning_rate": 0.0015170715775192824, "loss": 0.0859, "step": 39350 }, { "epoch": 0.99, "learning_rate": 0.0015166947215034044, "loss": 0.0847, "step": 39360 }, { "epoch": 0.99, "learning_rate": 0.0015163178654875264, "loss": 0.0879, "step": 39370 }, { "epoch": 0.99, "learning_rate": 0.001515941009471648, "loss": 0.0865, "step": 39380 }, { "epoch": 0.99, "learning_rate": 0.0015155641534557696, "loss": 0.0878, "step": 39390 }, { "epoch": 0.99, "learning_rate": 0.0015151872974398916, "loss": 0.0871, "step": 39400 }, { "epoch": 0.99, "learning_rate": 0.0015148104414240131, "loss": 0.0842, "step": 39410 }, { "epoch": 0.99, "learning_rate": 0.001514433585408135, "loss": 0.0883, "step": 39420 }, { "epoch": 0.99, "learning_rate": 0.0015140567293922568, "loss": 0.0833, "step": 39430 }, { "epoch": 0.99, "learning_rate": 0.0015136798733763788, "loss": 0.0864, "step": 39440 }, { "epoch": 0.99, "learning_rate": 0.0015133030173605003, "loss": 0.0888, "step": 39450 }, { "epoch": 0.99, "learning_rate": 0.0015129261613446223, "loss": 0.0835, "step": 39460 }, { "epoch": 0.99, "learning_rate": 0.001512549305328744, "loss": 0.0861, "step": 39470 }, { "epoch": 0.99, "learning_rate": 0.001512172449312866, "loss": 0.086, "step": 39480 }, { "epoch": 0.99, "learning_rate": 0.0015117955932969875, "loss": 0.085, "step": 39490 }, { "epoch": 0.99, "learning_rate": 0.0015114187372811095, "loss": 0.0858, "step": 39500 }, { "epoch": 0.99, "eval_cer": 0.6655954479460368, "eval_loss": 0.06882914155721664, "eval_runtime": 90.5569, "eval_samples_per_second": 110.417, "eval_steps_per_second": 6.902, "step": 39500 }, { "epoch": 0.99, "learning_rate": 0.0015110418812652314, "loss": 0.0906, "step": 39510 }, { "epoch": 0.99, "learning_rate": 0.0015106650252493532, "loss": 0.0863, "step": 39520 }, { "epoch": 0.99, "learning_rate": 0.0015102881692334747, "loss": 0.0858, "step": 39530 }, { "epoch": 0.99, "learning_rate": 0.0015099113132175967, "loss": 0.0859, "step": 39540 }, { "epoch": 0.99, "learning_rate": 0.0015095344572017186, "loss": 0.0843, "step": 39550 }, { "epoch": 0.99, "learning_rate": 0.0015091576011858404, "loss": 0.085, "step": 39560 }, { "epoch": 0.99, "learning_rate": 0.001508780745169962, "loss": 0.0908, "step": 39570 }, { "epoch": 0.99, "learning_rate": 0.0015084038891540839, "loss": 0.0845, "step": 39580 }, { "epoch": 0.99, "learning_rate": 0.0015080270331382058, "loss": 0.0847, "step": 39590 }, { "epoch": 0.99, "learning_rate": 0.0015076501771223276, "loss": 0.0871, "step": 39600 }, { "epoch": 1.0, "learning_rate": 0.0015072733211064493, "loss": 0.0857, "step": 39610 }, { "epoch": 1.0, "learning_rate": 0.001506896465090571, "loss": 0.0874, "step": 39620 }, { "epoch": 1.0, "learning_rate": 0.001506519609074693, "loss": 0.0863, "step": 39630 }, { "epoch": 1.0, "learning_rate": 0.0015061427530588146, "loss": 0.0854, "step": 39640 }, { "epoch": 1.0, "learning_rate": 0.0015057658970429365, "loss": 0.0858, "step": 39650 }, { "epoch": 1.0, "learning_rate": 0.0015053890410270583, "loss": 0.0907, "step": 39660 }, { "epoch": 1.0, "learning_rate": 0.0015050121850111802, "loss": 0.0882, "step": 39670 }, { "epoch": 1.0, "learning_rate": 0.0015046353289953017, "loss": 0.0859, "step": 39680 }, { "epoch": 1.0, "learning_rate": 0.0015042584729794237, "loss": 0.0833, "step": 39690 }, { "epoch": 1.0, "learning_rate": 0.0015038816169635455, "loss": 0.0846, "step": 39700 }, { "epoch": 1.0, "learning_rate": 0.0015035047609476674, "loss": 0.0839, "step": 39710 }, { "epoch": 1.0, "learning_rate": 0.001503127904931789, "loss": 0.0852, "step": 39720 }, { "epoch": 1.0, "learning_rate": 0.001502751048915911, "loss": 0.0892, "step": 39730 }, { "epoch": 1.0, "learning_rate": 0.0015023741929000326, "loss": 0.0885, "step": 39740 }, { "epoch": 1.0, "learning_rate": 0.0015019973368841546, "loss": 0.0857, "step": 39750 }, { "epoch": 1.0, "learning_rate": 0.0015016204808682761, "loss": 0.0866, "step": 39760 }, { "epoch": 1.0, "learning_rate": 0.001501243624852398, "loss": 0.0869, "step": 39770 }, { "epoch": 1.0, "learning_rate": 0.00150086676883652, "loss": 0.0851, "step": 39780 }, { "epoch": 1.0, "learning_rate": 0.0015004899128206418, "loss": 0.0851, "step": 39790 }, { "epoch": 1.0, "learning_rate": 0.0015001130568047633, "loss": 0.0856, "step": 39800 }, { "epoch": 1.0, "learning_rate": 0.0014997362007888853, "loss": 0.0823, "step": 39810 }, { "epoch": 1.0, "learning_rate": 0.0014993593447730073, "loss": 0.0843, "step": 39820 }, { "epoch": 1.0, "learning_rate": 0.0014989824887571288, "loss": 0.0779, "step": 39830 }, { "epoch": 1.0, "learning_rate": 0.0014986056327412505, "loss": 0.0803, "step": 39840 }, { "epoch": 1.0, "learning_rate": 0.0014982287767253725, "loss": 0.0808, "step": 39850 }, { "epoch": 1.0, "learning_rate": 0.0014978519207094942, "loss": 0.0836, "step": 39860 }, { "epoch": 1.0, "learning_rate": 0.0014974750646936162, "loss": 0.0778, "step": 39870 }, { "epoch": 1.0, "learning_rate": 0.0014970982086777377, "loss": 0.0786, "step": 39880 }, { "epoch": 1.0, "learning_rate": 0.0014967213526618597, "loss": 0.0768, "step": 39890 }, { "epoch": 1.0, "learning_rate": 0.0014963444966459814, "loss": 0.0819, "step": 39900 }, { "epoch": 1.0, "learning_rate": 0.0014959676406301034, "loss": 0.0801, "step": 39910 }, { "epoch": 1.0, "learning_rate": 0.0014955907846142251, "loss": 0.0788, "step": 39920 }, { "epoch": 1.0, "learning_rate": 0.0014952139285983469, "loss": 0.0818, "step": 39930 }, { "epoch": 1.0, "learning_rate": 0.0014948370725824686, "loss": 0.0809, "step": 39940 }, { "epoch": 1.0, "learning_rate": 0.0014944602165665906, "loss": 0.0779, "step": 39950 }, { "epoch": 1.0, "learning_rate": 0.0014940833605507123, "loss": 0.0791, "step": 39960 }, { "epoch": 1.0, "learning_rate": 0.001493706504534834, "loss": 0.0792, "step": 39970 }, { "epoch": 1.0, "learning_rate": 0.0014933296485189558, "loss": 0.0761, "step": 39980 }, { "epoch": 1.0, "learning_rate": 0.0014929527925030778, "loss": 0.0779, "step": 39990 }, { "epoch": 1.0, "learning_rate": 0.0014925759364871995, "loss": 0.0808, "step": 40000 }, { "epoch": 1.0, "eval_cer": 0.665779277933135, "eval_loss": 0.06800606101751328, "eval_runtime": 90.8369, "eval_samples_per_second": 110.076, "eval_steps_per_second": 6.88, "step": 40000 }, { "epoch": 1.01, "learning_rate": 0.0014921990804713213, "loss": 0.0828, "step": 40010 }, { "epoch": 1.01, "learning_rate": 0.001491822224455443, "loss": 0.0771, "step": 40020 }, { "epoch": 1.01, "learning_rate": 0.001491445368439565, "loss": 0.0794, "step": 40030 }, { "epoch": 1.01, "learning_rate": 0.0014910685124236867, "loss": 0.0812, "step": 40040 }, { "epoch": 1.01, "learning_rate": 0.0014906916564078085, "loss": 0.0781, "step": 40050 }, { "epoch": 1.01, "learning_rate": 0.0014903148003919302, "loss": 0.0791, "step": 40060 }, { "epoch": 1.01, "learning_rate": 0.001489937944376052, "loss": 0.0773, "step": 40070 }, { "epoch": 1.01, "learning_rate": 0.001489561088360174, "loss": 0.0797, "step": 40080 }, { "epoch": 1.01, "learning_rate": 0.0014891842323442957, "loss": 0.08, "step": 40090 }, { "epoch": 1.01, "learning_rate": 0.0014888073763284174, "loss": 0.0774, "step": 40100 }, { "epoch": 1.01, "learning_rate": 0.0014884305203125392, "loss": 0.08, "step": 40110 }, { "epoch": 1.01, "learning_rate": 0.0014880536642966611, "loss": 0.0746, "step": 40120 }, { "epoch": 1.01, "learning_rate": 0.0014876768082807829, "loss": 0.0809, "step": 40130 }, { "epoch": 1.01, "learning_rate": 0.0014872999522649048, "loss": 0.0798, "step": 40140 }, { "epoch": 1.01, "learning_rate": 0.0014869230962490263, "loss": 0.0806, "step": 40150 }, { "epoch": 1.01, "learning_rate": 0.0014865462402331483, "loss": 0.079, "step": 40160 }, { "epoch": 1.01, "learning_rate": 0.00148616938421727, "loss": 0.076, "step": 40170 }, { "epoch": 1.01, "learning_rate": 0.001485792528201392, "loss": 0.0816, "step": 40180 }, { "epoch": 1.01, "learning_rate": 0.0014854156721855138, "loss": 0.0786, "step": 40190 }, { "epoch": 1.01, "learning_rate": 0.0014850388161696355, "loss": 0.0837, "step": 40200 }, { "epoch": 1.01, "learning_rate": 0.0014846619601537572, "loss": 0.0779, "step": 40210 }, { "epoch": 1.01, "learning_rate": 0.0014842851041378792, "loss": 0.0775, "step": 40220 }, { "epoch": 1.01, "learning_rate": 0.001483908248122001, "loss": 0.0786, "step": 40230 }, { "epoch": 1.01, "learning_rate": 0.0014835313921061227, "loss": 0.0826, "step": 40240 }, { "epoch": 1.01, "learning_rate": 0.0014831545360902444, "loss": 0.0794, "step": 40250 }, { "epoch": 1.01, "learning_rate": 0.0014827776800743664, "loss": 0.082, "step": 40260 }, { "epoch": 1.01, "learning_rate": 0.0014824008240584882, "loss": 0.0801, "step": 40270 }, { "epoch": 1.01, "learning_rate": 0.00148202396804261, "loss": 0.0795, "step": 40280 }, { "epoch": 1.01, "learning_rate": 0.0014816471120267316, "loss": 0.0793, "step": 40290 }, { "epoch": 1.01, "learning_rate": 0.0014812702560108534, "loss": 0.0812, "step": 40300 }, { "epoch": 1.01, "learning_rate": 0.0014808933999949753, "loss": 0.0786, "step": 40310 }, { "epoch": 1.01, "learning_rate": 0.001480516543979097, "loss": 0.0835, "step": 40320 }, { "epoch": 1.01, "learning_rate": 0.0014801396879632188, "loss": 0.0803, "step": 40330 }, { "epoch": 1.01, "learning_rate": 0.0014797628319473406, "loss": 0.0768, "step": 40340 }, { "epoch": 1.01, "learning_rate": 0.0014793859759314625, "loss": 0.0818, "step": 40350 }, { "epoch": 1.01, "learning_rate": 0.0014790091199155843, "loss": 0.0765, "step": 40360 }, { "epoch": 1.01, "learning_rate": 0.001478632263899706, "loss": 0.0779, "step": 40370 }, { "epoch": 1.01, "learning_rate": 0.0014782554078838278, "loss": 0.0835, "step": 40380 }, { "epoch": 1.01, "learning_rate": 0.0014778785518679497, "loss": 0.0762, "step": 40390 }, { "epoch": 1.01, "learning_rate": 0.0014775016958520715, "loss": 0.079, "step": 40400 }, { "epoch": 1.02, "learning_rate": 0.0014771248398361934, "loss": 0.0802, "step": 40410 }, { "epoch": 1.02, "learning_rate": 0.001476747983820315, "loss": 0.083, "step": 40420 }, { "epoch": 1.02, "learning_rate": 0.001476371127804437, "loss": 0.0782, "step": 40430 }, { "epoch": 1.02, "learning_rate": 0.0014759942717885587, "loss": 0.0779, "step": 40440 }, { "epoch": 1.02, "learning_rate": 0.0014756174157726806, "loss": 0.0753, "step": 40450 }, { "epoch": 1.02, "learning_rate": 0.0014752405597568022, "loss": 0.0799, "step": 40460 }, { "epoch": 1.02, "learning_rate": 0.0014748637037409241, "loss": 0.0807, "step": 40470 }, { "epoch": 1.02, "learning_rate": 0.0014744868477250459, "loss": 0.0781, "step": 40480 }, { "epoch": 1.02, "learning_rate": 0.0014741099917091678, "loss": 0.0815, "step": 40490 }, { "epoch": 1.02, "learning_rate": 0.0014737331356932896, "loss": 0.0783, "step": 40500 }, { "epoch": 1.02, "eval_cer": 0.6657051684618964, "eval_loss": 0.06801352649927139, "eval_runtime": 90.9119, "eval_samples_per_second": 109.986, "eval_steps_per_second": 6.875, "step": 40500 }, { "epoch": 1.02, "learning_rate": 0.001473356279677411, "loss": 0.0779, "step": 40510 }, { "epoch": 1.02, "learning_rate": 0.001472979423661533, "loss": 0.0833, "step": 40520 }, { "epoch": 1.02, "learning_rate": 0.0014726025676456548, "loss": 0.0778, "step": 40530 }, { "epoch": 1.02, "learning_rate": 0.0014722257116297768, "loss": 0.084, "step": 40540 }, { "epoch": 1.02, "learning_rate": 0.0014718488556138985, "loss": 0.0814, "step": 40550 }, { "epoch": 1.02, "learning_rate": 0.0014714719995980203, "loss": 0.0806, "step": 40560 }, { "epoch": 1.02, "learning_rate": 0.001471095143582142, "loss": 0.0788, "step": 40570 }, { "epoch": 1.02, "learning_rate": 0.001470718287566264, "loss": 0.0822, "step": 40580 }, { "epoch": 1.02, "learning_rate": 0.0014703414315503857, "loss": 0.0778, "step": 40590 }, { "epoch": 1.02, "learning_rate": 0.0014699645755345075, "loss": 0.0771, "step": 40600 }, { "epoch": 1.02, "learning_rate": 0.0014695877195186292, "loss": 0.0766, "step": 40610 }, { "epoch": 1.02, "learning_rate": 0.0014692108635027512, "loss": 0.078, "step": 40620 }, { "epoch": 1.02, "learning_rate": 0.001468834007486873, "loss": 0.0759, "step": 40630 }, { "epoch": 1.02, "learning_rate": 0.0014684571514709947, "loss": 0.0787, "step": 40640 }, { "epoch": 1.02, "learning_rate": 0.0014680802954551164, "loss": 0.0778, "step": 40650 }, { "epoch": 1.02, "learning_rate": 0.0014677034394392384, "loss": 0.08, "step": 40660 }, { "epoch": 1.02, "learning_rate": 0.00146732658342336, "loss": 0.0763, "step": 40670 }, { "epoch": 1.02, "learning_rate": 0.0014669497274074818, "loss": 0.0784, "step": 40680 }, { "epoch": 1.02, "learning_rate": 0.0014665728713916036, "loss": 0.0786, "step": 40690 }, { "epoch": 1.02, "learning_rate": 0.0014661960153757256, "loss": 0.0769, "step": 40700 }, { "epoch": 1.02, "learning_rate": 0.0014658191593598473, "loss": 0.0787, "step": 40710 }, { "epoch": 1.02, "learning_rate": 0.001465442303343969, "loss": 0.0813, "step": 40720 }, { "epoch": 1.02, "learning_rate": 0.0014650654473280908, "loss": 0.0807, "step": 40730 }, { "epoch": 1.02, "learning_rate": 0.0014646885913122125, "loss": 0.0771, "step": 40740 }, { "epoch": 1.02, "learning_rate": 0.0014643117352963345, "loss": 0.0796, "step": 40750 }, { "epoch": 1.02, "learning_rate": 0.0014639348792804562, "loss": 0.078, "step": 40760 }, { "epoch": 1.02, "learning_rate": 0.0014635580232645782, "loss": 0.0757, "step": 40770 }, { "epoch": 1.02, "learning_rate": 0.0014631811672486997, "loss": 0.0785, "step": 40780 }, { "epoch": 1.02, "learning_rate": 0.0014628043112328217, "loss": 0.0792, "step": 40790 }, { "epoch": 1.03, "learning_rate": 0.0014624274552169434, "loss": 0.0769, "step": 40800 }, { "epoch": 1.03, "learning_rate": 0.0014620505992010654, "loss": 0.0819, "step": 40810 }, { "epoch": 1.03, "learning_rate": 0.0014616737431851871, "loss": 0.0815, "step": 40820 }, { "epoch": 1.03, "learning_rate": 0.0014612968871693089, "loss": 0.0788, "step": 40830 }, { "epoch": 1.03, "learning_rate": 0.0014609200311534306, "loss": 0.0764, "step": 40840 }, { "epoch": 1.03, "learning_rate": 0.0014605431751375526, "loss": 0.0775, "step": 40850 }, { "epoch": 1.03, "learning_rate": 0.0014601663191216743, "loss": 0.0845, "step": 40860 }, { "epoch": 1.03, "learning_rate": 0.001459789463105796, "loss": 0.0789, "step": 40870 }, { "epoch": 1.03, "learning_rate": 0.0014594126070899178, "loss": 0.0779, "step": 40880 }, { "epoch": 1.03, "learning_rate": 0.0014590357510740398, "loss": 0.0803, "step": 40890 }, { "epoch": 1.03, "learning_rate": 0.0014586588950581615, "loss": 0.0782, "step": 40900 }, { "epoch": 1.03, "learning_rate": 0.0014582820390422833, "loss": 0.0785, "step": 40910 }, { "epoch": 1.03, "learning_rate": 0.001457905183026405, "loss": 0.075, "step": 40920 }, { "epoch": 1.03, "learning_rate": 0.001457528327010527, "loss": 0.0831, "step": 40930 }, { "epoch": 1.03, "learning_rate": 0.0014571514709946487, "loss": 0.0776, "step": 40940 }, { "epoch": 1.03, "learning_rate": 0.0014567746149787705, "loss": 0.0794, "step": 40950 }, { "epoch": 1.03, "learning_rate": 0.0014563977589628922, "loss": 0.0811, "step": 40960 }, { "epoch": 1.03, "learning_rate": 0.001456020902947014, "loss": 0.0832, "step": 40970 }, { "epoch": 1.03, "learning_rate": 0.001455644046931136, "loss": 0.0818, "step": 40980 }, { "epoch": 1.03, "learning_rate": 0.0014552671909152577, "loss": 0.0833, "step": 40990 }, { "epoch": 1.03, "learning_rate": 0.0014548903348993794, "loss": 0.0822, "step": 41000 }, { "epoch": 1.03, "eval_cer": 0.6657999708374418, "eval_loss": 0.06757137924432755, "eval_runtime": 90.6292, "eval_samples_per_second": 110.329, "eval_steps_per_second": 6.896, "step": 41000 }, { "epoch": 1.03, "learning_rate": 0.0014545134788835012, "loss": 0.0816, "step": 41010 }, { "epoch": 1.03, "learning_rate": 0.0014541366228676231, "loss": 0.0803, "step": 41020 }, { "epoch": 1.03, "learning_rate": 0.0014537597668517449, "loss": 0.0761, "step": 41030 }, { "epoch": 1.03, "learning_rate": 0.0014533829108358666, "loss": 0.078, "step": 41040 }, { "epoch": 1.03, "learning_rate": 0.0014530060548199884, "loss": 0.0806, "step": 41050 }, { "epoch": 1.03, "learning_rate": 0.0014526291988041103, "loss": 0.0779, "step": 41060 }, { "epoch": 1.03, "learning_rate": 0.001452252342788232, "loss": 0.079, "step": 41070 }, { "epoch": 1.03, "learning_rate": 0.001451875486772354, "loss": 0.0778, "step": 41080 }, { "epoch": 1.03, "learning_rate": 0.0014514986307564755, "loss": 0.0755, "step": 41090 }, { "epoch": 1.03, "learning_rate": 0.0014511217747405975, "loss": 0.0805, "step": 41100 }, { "epoch": 1.03, "learning_rate": 0.0014507449187247193, "loss": 0.0765, "step": 41110 }, { "epoch": 1.03, "learning_rate": 0.0014503680627088412, "loss": 0.0777, "step": 41120 }, { "epoch": 1.03, "learning_rate": 0.001449991206692963, "loss": 0.0769, "step": 41130 }, { "epoch": 1.03, "learning_rate": 0.0014496143506770847, "loss": 0.0806, "step": 41140 }, { "epoch": 1.03, "learning_rate": 0.0014492374946612064, "loss": 0.0801, "step": 41150 }, { "epoch": 1.03, "learning_rate": 0.0014488606386453284, "loss": 0.0802, "step": 41160 }, { "epoch": 1.03, "learning_rate": 0.0014484837826294502, "loss": 0.0785, "step": 41170 }, { "epoch": 1.03, "learning_rate": 0.001448106926613572, "loss": 0.077, "step": 41180 }, { "epoch": 1.03, "learning_rate": 0.0014477300705976936, "loss": 0.0786, "step": 41190 }, { "epoch": 1.04, "learning_rate": 0.0014473532145818154, "loss": 0.0783, "step": 41200 }, { "epoch": 1.04, "learning_rate": 0.0014469763585659373, "loss": 0.0784, "step": 41210 }, { "epoch": 1.04, "learning_rate": 0.001446599502550059, "loss": 0.0782, "step": 41220 }, { "epoch": 1.04, "learning_rate": 0.0014462226465341808, "loss": 0.0773, "step": 41230 }, { "epoch": 1.04, "learning_rate": 0.0014458457905183026, "loss": 0.0797, "step": 41240 }, { "epoch": 1.04, "learning_rate": 0.0014454689345024245, "loss": 0.0812, "step": 41250 }, { "epoch": 1.04, "learning_rate": 0.0014450920784865463, "loss": 0.0825, "step": 41260 }, { "epoch": 1.04, "learning_rate": 0.001444715222470668, "loss": 0.0816, "step": 41270 }, { "epoch": 1.04, "learning_rate": 0.0014443383664547898, "loss": 0.0763, "step": 41280 }, { "epoch": 1.04, "learning_rate": 0.0014439615104389117, "loss": 0.0787, "step": 41290 }, { "epoch": 1.04, "learning_rate": 0.0014435846544230335, "loss": 0.0757, "step": 41300 }, { "epoch": 1.04, "learning_rate": 0.0014432077984071552, "loss": 0.0786, "step": 41310 }, { "epoch": 1.04, "learning_rate": 0.001442830942391277, "loss": 0.0764, "step": 41320 }, { "epoch": 1.04, "learning_rate": 0.001442454086375399, "loss": 0.0757, "step": 41330 }, { "epoch": 1.04, "learning_rate": 0.0014420772303595207, "loss": 0.0774, "step": 41340 }, { "epoch": 1.04, "learning_rate": 0.0014417003743436426, "loss": 0.0795, "step": 41350 }, { "epoch": 1.04, "learning_rate": 0.0014413235183277642, "loss": 0.0795, "step": 41360 }, { "epoch": 1.04, "learning_rate": 0.0014409466623118861, "loss": 0.0797, "step": 41370 }, { "epoch": 1.04, "learning_rate": 0.0014405698062960079, "loss": 0.0804, "step": 41380 }, { "epoch": 1.04, "learning_rate": 0.0014401929502801296, "loss": 0.0768, "step": 41390 }, { "epoch": 1.04, "learning_rate": 0.0014398160942642516, "loss": 0.0795, "step": 41400 }, { "epoch": 1.04, "learning_rate": 0.0014394392382483731, "loss": 0.0789, "step": 41410 }, { "epoch": 1.04, "learning_rate": 0.001439062382232495, "loss": 0.0791, "step": 41420 }, { "epoch": 1.04, "learning_rate": 0.0014386855262166168, "loss": 0.0811, "step": 41430 }, { "epoch": 1.04, "learning_rate": 0.0014383086702007388, "loss": 0.0755, "step": 41440 }, { "epoch": 1.04, "learning_rate": 0.0014379318141848603, "loss": 0.0772, "step": 41450 }, { "epoch": 1.04, "learning_rate": 0.0014375549581689823, "loss": 0.0828, "step": 41460 }, { "epoch": 1.04, "learning_rate": 0.001437178102153104, "loss": 0.082, "step": 41470 }, { "epoch": 1.04, "learning_rate": 0.001436801246137226, "loss": 0.0757, "step": 41480 }, { "epoch": 1.04, "learning_rate": 0.0014364243901213477, "loss": 0.0775, "step": 41490 }, { "epoch": 1.04, "learning_rate": 0.0014360475341054695, "loss": 0.077, "step": 41500 }, { "epoch": 1.04, "eval_cer": 0.6657475167311756, "eval_loss": 0.0675220713019371, "eval_runtime": 90.5271, "eval_samples_per_second": 110.453, "eval_steps_per_second": 6.904, "step": 41500 }, { "epoch": 1.04, "learning_rate": 0.0014356706780895912, "loss": 0.0812, "step": 41510 }, { "epoch": 1.04, "learning_rate": 0.0014352938220737132, "loss": 0.08, "step": 41520 }, { "epoch": 1.04, "learning_rate": 0.001434916966057835, "loss": 0.0765, "step": 41530 }, { "epoch": 1.04, "learning_rate": 0.0014345401100419567, "loss": 0.0768, "step": 41540 }, { "epoch": 1.04, "learning_rate": 0.0014341632540260784, "loss": 0.0788, "step": 41550 }, { "epoch": 1.04, "learning_rate": 0.0014337863980102004, "loss": 0.0817, "step": 41560 }, { "epoch": 1.04, "learning_rate": 0.001433409541994322, "loss": 0.0797, "step": 41570 }, { "epoch": 1.04, "learning_rate": 0.0014330326859784439, "loss": 0.0807, "step": 41580 }, { "epoch": 1.04, "learning_rate": 0.0014326558299625656, "loss": 0.0763, "step": 41590 }, { "epoch": 1.05, "learning_rate": 0.0014322789739466876, "loss": 0.0777, "step": 41600 }, { "epoch": 1.05, "learning_rate": 0.0014319021179308093, "loss": 0.0768, "step": 41610 }, { "epoch": 1.05, "learning_rate": 0.001431525261914931, "loss": 0.0784, "step": 41620 }, { "epoch": 1.05, "learning_rate": 0.0014311484058990528, "loss": 0.0775, "step": 41630 }, { "epoch": 1.05, "learning_rate": 0.0014307715498831745, "loss": 0.0798, "step": 41640 }, { "epoch": 1.05, "learning_rate": 0.0014303946938672965, "loss": 0.0781, "step": 41650 }, { "epoch": 1.05, "learning_rate": 0.0014300178378514182, "loss": 0.0787, "step": 41660 }, { "epoch": 1.05, "learning_rate": 0.00142964098183554, "loss": 0.0804, "step": 41670 }, { "epoch": 1.05, "learning_rate": 0.0014292641258196617, "loss": 0.0802, "step": 41680 }, { "epoch": 1.05, "learning_rate": 0.0014288872698037837, "loss": 0.0798, "step": 41690 }, { "epoch": 1.05, "learning_rate": 0.0014285104137879054, "loss": 0.0786, "step": 41700 }, { "epoch": 1.05, "learning_rate": 0.0014281335577720274, "loss": 0.0798, "step": 41710 }, { "epoch": 1.05, "learning_rate": 0.001427756701756149, "loss": 0.0793, "step": 41720 }, { "epoch": 1.05, "learning_rate": 0.0014273798457402709, "loss": 0.08, "step": 41730 }, { "epoch": 1.05, "learning_rate": 0.0014270029897243926, "loss": 0.0793, "step": 41740 }, { "epoch": 1.05, "learning_rate": 0.0014266261337085146, "loss": 0.0795, "step": 41750 }, { "epoch": 1.05, "learning_rate": 0.0014262492776926363, "loss": 0.0796, "step": 41760 }, { "epoch": 1.05, "learning_rate": 0.001425872421676758, "loss": 0.0833, "step": 41770 }, { "epoch": 1.05, "learning_rate": 0.0014254955656608798, "loss": 0.0808, "step": 41780 }, { "epoch": 1.05, "learning_rate": 0.0014251187096450018, "loss": 0.0769, "step": 41790 }, { "epoch": 1.05, "learning_rate": 0.0014247418536291235, "loss": 0.0781, "step": 41800 }, { "epoch": 1.05, "learning_rate": 0.0014243649976132453, "loss": 0.0753, "step": 41810 }, { "epoch": 1.05, "learning_rate": 0.001423988141597367, "loss": 0.0789, "step": 41820 }, { "epoch": 1.05, "learning_rate": 0.0014236112855814888, "loss": 0.078, "step": 41830 }, { "epoch": 1.05, "learning_rate": 0.0014232344295656107, "loss": 0.0754, "step": 41840 }, { "epoch": 1.05, "learning_rate": 0.0014228575735497325, "loss": 0.0766, "step": 41850 }, { "epoch": 1.05, "learning_rate": 0.0014224807175338542, "loss": 0.0749, "step": 41860 }, { "epoch": 1.05, "learning_rate": 0.001422103861517976, "loss": 0.0807, "step": 41870 }, { "epoch": 1.05, "learning_rate": 0.001421727005502098, "loss": 0.0805, "step": 41880 }, { "epoch": 1.05, "learning_rate": 0.0014213501494862197, "loss": 0.0793, "step": 41890 }, { "epoch": 1.05, "learning_rate": 0.0014209732934703414, "loss": 0.0769, "step": 41900 }, { "epoch": 1.05, "learning_rate": 0.0014205964374544632, "loss": 0.082, "step": 41910 }, { "epoch": 1.05, "learning_rate": 0.0014202195814385851, "loss": 0.0765, "step": 41920 }, { "epoch": 1.05, "learning_rate": 0.0014198427254227069, "loss": 0.0783, "step": 41930 }, { "epoch": 1.05, "learning_rate": 0.0014194658694068286, "loss": 0.0794, "step": 41940 }, { "epoch": 1.05, "learning_rate": 0.0014190890133909504, "loss": 0.0765, "step": 41950 }, { "epoch": 1.05, "learning_rate": 0.0014187121573750723, "loss": 0.0785, "step": 41960 }, { "epoch": 1.05, "learning_rate": 0.001418335301359194, "loss": 0.0787, "step": 41970 }, { "epoch": 1.05, "learning_rate": 0.001417958445343316, "loss": 0.0797, "step": 41980 }, { "epoch": 1.05, "learning_rate": 0.0014175815893274376, "loss": 0.0779, "step": 41990 }, { "epoch": 1.06, "learning_rate": 0.0014172047333115595, "loss": 0.0788, "step": 42000 }, { "epoch": 1.06, "eval_cer": 0.6654881335818407, "eval_loss": 0.06726432591676712, "eval_runtime": 90.7258, "eval_samples_per_second": 110.211, "eval_steps_per_second": 6.889, "step": 42000 }, { "epoch": 1.06, "learning_rate": 0.0014168278772956813, "loss": 0.0801, "step": 42010 }, { "epoch": 1.06, "learning_rate": 0.0014164510212798032, "loss": 0.0776, "step": 42020 }, { "epoch": 1.06, "learning_rate": 0.0014160741652639247, "loss": 0.0782, "step": 42030 }, { "epoch": 1.06, "learning_rate": 0.0014156973092480467, "loss": 0.0778, "step": 42040 }, { "epoch": 1.06, "learning_rate": 0.0014153204532321685, "loss": 0.0781, "step": 42050 }, { "epoch": 1.06, "learning_rate": 0.0014149435972162902, "loss": 0.0793, "step": 42060 }, { "epoch": 1.06, "learning_rate": 0.0014145667412004122, "loss": 0.0788, "step": 42070 }, { "epoch": 1.06, "learning_rate": 0.0014141898851845337, "loss": 0.0792, "step": 42080 }, { "epoch": 1.06, "learning_rate": 0.0014138130291686556, "loss": 0.0779, "step": 42090 }, { "epoch": 1.06, "learning_rate": 0.0014134361731527774, "loss": 0.082, "step": 42100 }, { "epoch": 1.06, "learning_rate": 0.0014130593171368994, "loss": 0.0783, "step": 42110 }, { "epoch": 1.06, "learning_rate": 0.001412682461121021, "loss": 0.0751, "step": 42120 }, { "epoch": 1.06, "learning_rate": 0.0014123056051051428, "loss": 0.0807, "step": 42130 }, { "epoch": 1.06, "learning_rate": 0.0014119287490892646, "loss": 0.0753, "step": 42140 }, { "epoch": 1.06, "learning_rate": 0.0014115518930733865, "loss": 0.0764, "step": 42150 }, { "epoch": 1.06, "learning_rate": 0.0014111750370575083, "loss": 0.0803, "step": 42160 }, { "epoch": 1.06, "learning_rate": 0.00141079818104163, "loss": 0.077, "step": 42170 }, { "epoch": 1.06, "learning_rate": 0.0014104213250257518, "loss": 0.0771, "step": 42180 }, { "epoch": 1.06, "learning_rate": 0.0014100444690098737, "loss": 0.0804, "step": 42190 }, { "epoch": 1.06, "learning_rate": 0.0014096676129939955, "loss": 0.0763, "step": 42200 }, { "epoch": 1.06, "learning_rate": 0.0014092907569781172, "loss": 0.0799, "step": 42210 }, { "epoch": 1.06, "learning_rate": 0.001408913900962239, "loss": 0.0751, "step": 42220 }, { "epoch": 1.06, "learning_rate": 0.001408537044946361, "loss": 0.0793, "step": 42230 }, { "epoch": 1.06, "learning_rate": 0.0014081601889304827, "loss": 0.0746, "step": 42240 }, { "epoch": 1.06, "learning_rate": 0.0014077833329146044, "loss": 0.0778, "step": 42250 }, { "epoch": 1.06, "learning_rate": 0.0014074064768987262, "loss": 0.0791, "step": 42260 }, { "epoch": 1.06, "learning_rate": 0.0014070296208828481, "loss": 0.0787, "step": 42270 }, { "epoch": 1.06, "learning_rate": 0.0014066527648669699, "loss": 0.0759, "step": 42280 }, { "epoch": 1.06, "learning_rate": 0.0014062759088510916, "loss": 0.0782, "step": 42290 }, { "epoch": 1.06, "learning_rate": 0.0014058990528352134, "loss": 0.0803, "step": 42300 }, { "epoch": 1.06, "learning_rate": 0.0014055221968193351, "loss": 0.0776, "step": 42310 }, { "epoch": 1.06, "learning_rate": 0.001405145340803457, "loss": 0.0793, "step": 42320 }, { "epoch": 1.06, "learning_rate": 0.0014047684847875788, "loss": 0.0783, "step": 42330 }, { "epoch": 1.06, "learning_rate": 0.0014043916287717008, "loss": 0.076, "step": 42340 }, { "epoch": 1.06, "learning_rate": 0.0014040147727558223, "loss": 0.0795, "step": 42350 }, { "epoch": 1.06, "learning_rate": 0.0014036379167399443, "loss": 0.0742, "step": 42360 }, { "epoch": 1.06, "learning_rate": 0.001403261060724066, "loss": 0.0784, "step": 42370 }, { "epoch": 1.06, "learning_rate": 0.001402884204708188, "loss": 0.0767, "step": 42380 }, { "epoch": 1.06, "learning_rate": 0.0014025073486923097, "loss": 0.0789, "step": 42390 }, { "epoch": 1.07, "learning_rate": 0.0014021304926764315, "loss": 0.0753, "step": 42400 }, { "epoch": 1.07, "learning_rate": 0.0014017536366605532, "loss": 0.0762, "step": 42410 }, { "epoch": 1.07, "learning_rate": 0.0014013767806446752, "loss": 0.0782, "step": 42420 }, { "epoch": 1.07, "learning_rate": 0.001400999924628797, "loss": 0.0794, "step": 42430 }, { "epoch": 1.07, "learning_rate": 0.0014006230686129187, "loss": 0.0763, "step": 42440 }, { "epoch": 1.07, "learning_rate": 0.0014002462125970404, "loss": 0.0812, "step": 42450 }, { "epoch": 1.07, "learning_rate": 0.0013998693565811624, "loss": 0.0786, "step": 42460 }, { "epoch": 1.07, "learning_rate": 0.0013994925005652841, "loss": 0.0789, "step": 42470 }, { "epoch": 1.07, "learning_rate": 0.0013991156445494059, "loss": 0.0781, "step": 42480 }, { "epoch": 1.07, "learning_rate": 0.0013987387885335276, "loss": 0.0788, "step": 42490 }, { "epoch": 1.07, "learning_rate": 0.0013983619325176493, "loss": 0.0754, "step": 42500 }, { "epoch": 1.07, "eval_cer": 0.6660415484644662, "eval_loss": 0.06667615473270416, "eval_runtime": 90.6952, "eval_samples_per_second": 110.248, "eval_steps_per_second": 6.891, "step": 42500 }, { "epoch": 1.07, "learning_rate": 0.0013979850765017713, "loss": 0.0779, "step": 42510 }, { "epoch": 1.07, "learning_rate": 0.001397608220485893, "loss": 0.079, "step": 42520 }, { "epoch": 1.07, "learning_rate": 0.0013972313644700148, "loss": 0.0788, "step": 42530 }, { "epoch": 1.07, "learning_rate": 0.0013968545084541365, "loss": 0.0782, "step": 42540 }, { "epoch": 1.07, "learning_rate": 0.0013964776524382585, "loss": 0.0774, "step": 42550 }, { "epoch": 1.07, "learning_rate": 0.0013961007964223802, "loss": 0.0759, "step": 42560 }, { "epoch": 1.07, "learning_rate": 0.001395723940406502, "loss": 0.076, "step": 42570 }, { "epoch": 1.07, "learning_rate": 0.0013953470843906237, "loss": 0.082, "step": 42580 }, { "epoch": 1.07, "learning_rate": 0.0013949702283747457, "loss": 0.0797, "step": 42590 }, { "epoch": 1.07, "learning_rate": 0.0013945933723588674, "loss": 0.08, "step": 42600 }, { "epoch": 1.07, "learning_rate": 0.0013942165163429892, "loss": 0.0797, "step": 42610 }, { "epoch": 1.07, "learning_rate": 0.001393839660327111, "loss": 0.0774, "step": 42620 }, { "epoch": 1.07, "learning_rate": 0.001393462804311233, "loss": 0.0782, "step": 42630 }, { "epoch": 1.07, "learning_rate": 0.0013930859482953546, "loss": 0.0805, "step": 42640 }, { "epoch": 1.07, "learning_rate": 0.0013927090922794766, "loss": 0.0779, "step": 42650 }, { "epoch": 1.07, "learning_rate": 0.0013923322362635981, "loss": 0.0794, "step": 42660 }, { "epoch": 1.07, "learning_rate": 0.00139195538024772, "loss": 0.0783, "step": 42670 }, { "epoch": 1.07, "learning_rate": 0.0013915785242318418, "loss": 0.0768, "step": 42680 }, { "epoch": 1.07, "learning_rate": 0.0013912016682159638, "loss": 0.0788, "step": 42690 }, { "epoch": 1.07, "learning_rate": 0.0013908248122000855, "loss": 0.0743, "step": 42700 }, { "epoch": 1.07, "learning_rate": 0.0013904479561842073, "loss": 0.0781, "step": 42710 }, { "epoch": 1.07, "learning_rate": 0.001390071100168329, "loss": 0.078, "step": 42720 }, { "epoch": 1.07, "learning_rate": 0.0013896942441524508, "loss": 0.0773, "step": 42730 }, { "epoch": 1.07, "learning_rate": 0.0013893173881365727, "loss": 0.0761, "step": 42740 }, { "epoch": 1.07, "learning_rate": 0.0013889405321206945, "loss": 0.0763, "step": 42750 }, { "epoch": 1.07, "learning_rate": 0.0013885636761048162, "loss": 0.0746, "step": 42760 }, { "epoch": 1.07, "learning_rate": 0.001388186820088938, "loss": 0.0826, "step": 42770 }, { "epoch": 1.07, "learning_rate": 0.00138780996407306, "loss": 0.0804, "step": 42780 }, { "epoch": 1.08, "learning_rate": 0.0013874331080571817, "loss": 0.0782, "step": 42790 }, { "epoch": 1.08, "learning_rate": 0.0013870562520413034, "loss": 0.0796, "step": 42800 }, { "epoch": 1.08, "learning_rate": 0.0013866793960254252, "loss": 0.0778, "step": 42810 }, { "epoch": 1.08, "learning_rate": 0.0013863025400095471, "loss": 0.0791, "step": 42820 }, { "epoch": 1.08, "learning_rate": 0.0013859256839936689, "loss": 0.0778, "step": 42830 }, { "epoch": 1.08, "learning_rate": 0.0013855488279777906, "loss": 0.0774, "step": 42840 }, { "epoch": 1.08, "learning_rate": 0.0013851719719619124, "loss": 0.0764, "step": 42850 }, { "epoch": 1.08, "learning_rate": 0.0013847951159460343, "loss": 0.0795, "step": 42860 }, { "epoch": 1.08, "learning_rate": 0.001384418259930156, "loss": 0.0789, "step": 42870 }, { "epoch": 1.08, "learning_rate": 0.0013840414039142778, "loss": 0.0786, "step": 42880 }, { "epoch": 1.08, "learning_rate": 0.0013836645478983996, "loss": 0.0779, "step": 42890 }, { "epoch": 1.08, "learning_rate": 0.0013832876918825215, "loss": 0.0746, "step": 42900 }, { "epoch": 1.08, "learning_rate": 0.0013829108358666433, "loss": 0.0786, "step": 42910 }, { "epoch": 1.08, "learning_rate": 0.0013825339798507652, "loss": 0.0782, "step": 42920 }, { "epoch": 1.08, "learning_rate": 0.0013821571238348867, "loss": 0.0765, "step": 42930 }, { "epoch": 1.08, "learning_rate": 0.0013817802678190087, "loss": 0.0765, "step": 42940 }, { "epoch": 1.08, "learning_rate": 0.0013814034118031305, "loss": 0.0782, "step": 42950 }, { "epoch": 1.08, "learning_rate": 0.0013810265557872522, "loss": 0.0778, "step": 42960 }, { "epoch": 1.08, "learning_rate": 0.0013806496997713742, "loss": 0.0795, "step": 42970 }, { "epoch": 1.08, "learning_rate": 0.0013802728437554957, "loss": 0.0776, "step": 42980 }, { "epoch": 1.08, "learning_rate": 0.0013798959877396177, "loss": 0.0786, "step": 42990 }, { "epoch": 1.08, "learning_rate": 0.0013795191317237394, "loss": 0.0762, "step": 43000 }, { "epoch": 1.08, "eval_cer": 0.6656464583613049, "eval_loss": 0.06690527498722076, "eval_runtime": 90.8509, "eval_samples_per_second": 110.059, "eval_steps_per_second": 6.879, "step": 43000 }, { "epoch": 1.08, "learning_rate": 0.0013791422757078614, "loss": 0.0775, "step": 43010 }, { "epoch": 1.08, "learning_rate": 0.0013787654196919829, "loss": 0.0783, "step": 43020 }, { "epoch": 1.08, "learning_rate": 0.0013783885636761048, "loss": 0.083, "step": 43030 }, { "epoch": 1.08, "learning_rate": 0.0013780117076602266, "loss": 0.0778, "step": 43040 }, { "epoch": 1.08, "learning_rate": 0.0013776348516443486, "loss": 0.0799, "step": 43050 }, { "epoch": 1.08, "learning_rate": 0.0013772579956284703, "loss": 0.0757, "step": 43060 }, { "epoch": 1.08, "learning_rate": 0.001376881139612592, "loss": 0.0781, "step": 43070 }, { "epoch": 1.08, "learning_rate": 0.0013765042835967138, "loss": 0.0769, "step": 43080 }, { "epoch": 1.08, "learning_rate": 0.0013761274275808357, "loss": 0.0786, "step": 43090 }, { "epoch": 1.08, "learning_rate": 0.0013757505715649575, "loss": 0.0808, "step": 43100 }, { "epoch": 1.08, "learning_rate": 0.0013753737155490792, "loss": 0.0775, "step": 43110 }, { "epoch": 1.08, "learning_rate": 0.001374996859533201, "loss": 0.0813, "step": 43120 }, { "epoch": 1.08, "learning_rate": 0.001374620003517323, "loss": 0.0799, "step": 43130 }, { "epoch": 1.08, "learning_rate": 0.0013742431475014447, "loss": 0.0771, "step": 43140 }, { "epoch": 1.08, "learning_rate": 0.0013738662914855664, "loss": 0.0771, "step": 43150 }, { "epoch": 1.08, "learning_rate": 0.0013734894354696882, "loss": 0.079, "step": 43160 }, { "epoch": 1.08, "learning_rate": 0.00137311257945381, "loss": 0.0782, "step": 43170 }, { "epoch": 1.08, "learning_rate": 0.0013727357234379319, "loss": 0.0782, "step": 43180 }, { "epoch": 1.09, "learning_rate": 0.0013723588674220536, "loss": 0.0799, "step": 43190 }, { "epoch": 1.09, "learning_rate": 0.0013719820114061754, "loss": 0.0763, "step": 43200 }, { "epoch": 1.09, "learning_rate": 0.0013716051553902971, "loss": 0.0777, "step": 43210 }, { "epoch": 1.09, "learning_rate": 0.001371228299374419, "loss": 0.0809, "step": 43220 }, { "epoch": 1.09, "learning_rate": 0.0013708514433585408, "loss": 0.0774, "step": 43230 }, { "epoch": 1.09, "learning_rate": 0.0013704745873426626, "loss": 0.077, "step": 43240 }, { "epoch": 1.09, "learning_rate": 0.0013700977313267843, "loss": 0.0765, "step": 43250 }, { "epoch": 1.09, "learning_rate": 0.0013697208753109063, "loss": 0.0786, "step": 43260 }, { "epoch": 1.09, "learning_rate": 0.001369344019295028, "loss": 0.0796, "step": 43270 }, { "epoch": 1.09, "learning_rate": 0.00136896716327915, "loss": 0.0771, "step": 43280 }, { "epoch": 1.09, "learning_rate": 0.0013685903072632715, "loss": 0.076, "step": 43290 }, { "epoch": 1.09, "learning_rate": 0.0013682134512473935, "loss": 0.0771, "step": 43300 }, { "epoch": 1.09, "learning_rate": 0.0013678365952315152, "loss": 0.0796, "step": 43310 }, { "epoch": 1.09, "learning_rate": 0.0013674597392156372, "loss": 0.0757, "step": 43320 }, { "epoch": 1.09, "learning_rate": 0.001367082883199759, "loss": 0.0752, "step": 43330 }, { "epoch": 1.09, "learning_rate": 0.0013667060271838807, "loss": 0.0763, "step": 43340 }, { "epoch": 1.09, "learning_rate": 0.0013663291711680024, "loss": 0.0771, "step": 43350 }, { "epoch": 1.09, "learning_rate": 0.0013659523151521244, "loss": 0.0762, "step": 43360 }, { "epoch": 1.09, "learning_rate": 0.0013655754591362461, "loss": 0.0792, "step": 43370 }, { "epoch": 1.09, "learning_rate": 0.0013651986031203679, "loss": 0.0789, "step": 43380 }, { "epoch": 1.09, "learning_rate": 0.0013648217471044896, "loss": 0.0783, "step": 43390 }, { "epoch": 1.09, "learning_rate": 0.0013644448910886113, "loss": 0.0777, "step": 43400 }, { "epoch": 1.09, "learning_rate": 0.0013640680350727333, "loss": 0.0761, "step": 43410 }, { "epoch": 1.09, "learning_rate": 0.001363691179056855, "loss": 0.0774, "step": 43420 }, { "epoch": 1.09, "learning_rate": 0.0013633143230409768, "loss": 0.0757, "step": 43430 }, { "epoch": 1.09, "learning_rate": 0.0013629374670250985, "loss": 0.0771, "step": 43440 }, { "epoch": 1.09, "learning_rate": 0.0013625606110092205, "loss": 0.0791, "step": 43450 }, { "epoch": 1.09, "learning_rate": 0.0013621837549933423, "loss": 0.0754, "step": 43460 }, { "epoch": 1.09, "learning_rate": 0.001361806898977464, "loss": 0.0782, "step": 43470 }, { "epoch": 1.09, "learning_rate": 0.0013614300429615857, "loss": 0.0767, "step": 43480 }, { "epoch": 1.09, "learning_rate": 0.0013610531869457077, "loss": 0.079, "step": 43490 }, { "epoch": 1.09, "learning_rate": 0.0013606763309298294, "loss": 0.075, "step": 43500 }, { "epoch": 1.09, "eval_cer": 0.6659833195942073, "eval_loss": 0.06602948158979416, "eval_runtime": 90.5861, "eval_samples_per_second": 110.381, "eval_steps_per_second": 6.9, "step": 43500 }, { "epoch": 1.09, "learning_rate": 0.0013602994749139512, "loss": 0.0779, "step": 43510 }, { "epoch": 1.09, "learning_rate": 0.001359922618898073, "loss": 0.0743, "step": 43520 }, { "epoch": 1.09, "learning_rate": 0.001359545762882195, "loss": 0.0745, "step": 43530 }, { "epoch": 1.09, "learning_rate": 0.0013591689068663166, "loss": 0.0734, "step": 43540 }, { "epoch": 1.09, "learning_rate": 0.0013587920508504386, "loss": 0.0802, "step": 43550 }, { "epoch": 1.09, "learning_rate": 0.0013584151948345601, "loss": 0.0774, "step": 43560 }, { "epoch": 1.09, "learning_rate": 0.001358038338818682, "loss": 0.0764, "step": 43570 }, { "epoch": 1.09, "learning_rate": 0.0013576614828028038, "loss": 0.0796, "step": 43580 }, { "epoch": 1.1, "learning_rate": 0.0013572846267869258, "loss": 0.0774, "step": 43590 }, { "epoch": 1.1, "learning_rate": 0.0013569077707710473, "loss": 0.0725, "step": 43600 }, { "epoch": 1.1, "learning_rate": 0.001356530914755169, "loss": 0.0786, "step": 43610 }, { "epoch": 1.1, "learning_rate": 0.001356154058739291, "loss": 0.0805, "step": 43620 }, { "epoch": 1.1, "learning_rate": 0.0013557772027234128, "loss": 0.0748, "step": 43630 }, { "epoch": 1.1, "learning_rate": 0.0013554003467075347, "loss": 0.077, "step": 43640 }, { "epoch": 1.1, "learning_rate": 0.0013550234906916563, "loss": 0.0801, "step": 43650 }, { "epoch": 1.1, "learning_rate": 0.0013546466346757782, "loss": 0.0799, "step": 43660 }, { "epoch": 1.1, "learning_rate": 0.0013542697786599, "loss": 0.0758, "step": 43670 }, { "epoch": 1.1, "learning_rate": 0.001353892922644022, "loss": 0.0762, "step": 43680 }, { "epoch": 1.1, "learning_rate": 0.0013535160666281437, "loss": 0.0767, "step": 43690 }, { "epoch": 1.1, "learning_rate": 0.0013531392106122654, "loss": 0.0767, "step": 43700 }, { "epoch": 1.1, "learning_rate": 0.0013527623545963872, "loss": 0.0749, "step": 43710 }, { "epoch": 1.1, "learning_rate": 0.0013523854985805091, "loss": 0.0775, "step": 43720 }, { "epoch": 1.1, "learning_rate": 0.0013520086425646309, "loss": 0.0767, "step": 43730 }, { "epoch": 1.1, "learning_rate": 0.0013516317865487526, "loss": 0.0774, "step": 43740 }, { "epoch": 1.1, "learning_rate": 0.0013512549305328744, "loss": 0.0766, "step": 43750 }, { "epoch": 1.1, "learning_rate": 0.0013508780745169963, "loss": 0.0779, "step": 43760 }, { "epoch": 1.1, "learning_rate": 0.001350501218501118, "loss": 0.0802, "step": 43770 }, { "epoch": 1.1, "learning_rate": 0.0013501243624852398, "loss": 0.0799, "step": 43780 }, { "epoch": 1.1, "learning_rate": 0.0013497475064693616, "loss": 0.0845, "step": 43790 }, { "epoch": 1.1, "learning_rate": 0.0013493706504534835, "loss": 0.0807, "step": 43800 }, { "epoch": 1.1, "learning_rate": 0.0013489937944376053, "loss": 0.0816, "step": 43810 }, { "epoch": 1.1, "learning_rate": 0.001348616938421727, "loss": 0.079, "step": 43820 }, { "epoch": 1.1, "learning_rate": 0.0013482400824058488, "loss": 0.0768, "step": 43830 }, { "epoch": 1.1, "learning_rate": 0.0013478632263899705, "loss": 0.0753, "step": 43840 }, { "epoch": 1.1, "learning_rate": 0.0013474863703740925, "loss": 0.0759, "step": 43850 }, { "epoch": 1.1, "learning_rate": 0.0013471095143582142, "loss": 0.0804, "step": 43860 }, { "epoch": 1.1, "learning_rate": 0.001346732658342336, "loss": 0.082, "step": 43870 }, { "epoch": 1.1, "learning_rate": 0.0013463558023264577, "loss": 0.0809, "step": 43880 }, { "epoch": 1.1, "learning_rate": 0.0013459789463105797, "loss": 0.0835, "step": 43890 }, { "epoch": 1.1, "learning_rate": 0.0013456020902947014, "loss": 0.0748, "step": 43900 }, { "epoch": 1.1, "learning_rate": 0.0013452252342788234, "loss": 0.0787, "step": 43910 }, { "epoch": 1.1, "learning_rate": 0.0013448483782629449, "loss": 0.0818, "step": 43920 }, { "epoch": 1.1, "learning_rate": 0.0013444715222470669, "loss": 0.077, "step": 43930 }, { "epoch": 1.1, "learning_rate": 0.0013440946662311886, "loss": 0.0752, "step": 43940 }, { "epoch": 1.1, "learning_rate": 0.0013437178102153106, "loss": 0.074, "step": 43950 }, { "epoch": 1.1, "learning_rate": 0.0013433409541994323, "loss": 0.0759, "step": 43960 }, { "epoch": 1.1, "learning_rate": 0.001342964098183554, "loss": 0.078, "step": 43970 }, { "epoch": 1.1, "learning_rate": 0.0013425872421676758, "loss": 0.0755, "step": 43980 }, { "epoch": 1.11, "learning_rate": 0.0013422103861517978, "loss": 0.0779, "step": 43990 }, { "epoch": 1.11, "learning_rate": 0.0013418335301359195, "loss": 0.0816, "step": 44000 }, { "epoch": 1.11, "eval_cer": 0.6656503082039665, "eval_loss": 0.06611749529838562, "eval_runtime": 90.5698, "eval_samples_per_second": 110.401, "eval_steps_per_second": 6.901, "step": 44000 }, { "epoch": 1.11, "learning_rate": 0.0013414566741200412, "loss": 0.0785, "step": 44010 }, { "epoch": 1.11, "learning_rate": 0.001341079818104163, "loss": 0.0781, "step": 44020 }, { "epoch": 1.11, "learning_rate": 0.001340702962088285, "loss": 0.0765, "step": 44030 }, { "epoch": 1.11, "learning_rate": 0.0013403261060724067, "loss": 0.0816, "step": 44040 }, { "epoch": 1.11, "learning_rate": 0.0013399492500565284, "loss": 0.0768, "step": 44050 }, { "epoch": 1.11, "learning_rate": 0.0013395723940406502, "loss": 0.0786, "step": 44060 }, { "epoch": 1.11, "learning_rate": 0.001339195538024772, "loss": 0.0775, "step": 44070 }, { "epoch": 1.11, "learning_rate": 0.0013388186820088939, "loss": 0.0799, "step": 44080 }, { "epoch": 1.11, "learning_rate": 0.0013384418259930156, "loss": 0.0773, "step": 44090 }, { "epoch": 1.11, "learning_rate": 0.0013380649699771374, "loss": 0.076, "step": 44100 }, { "epoch": 1.11, "learning_rate": 0.0013376881139612591, "loss": 0.0775, "step": 44110 }, { "epoch": 1.11, "learning_rate": 0.001337311257945381, "loss": 0.079, "step": 44120 }, { "epoch": 1.11, "learning_rate": 0.0013369344019295028, "loss": 0.0793, "step": 44130 }, { "epoch": 1.11, "learning_rate": 0.0013365575459136246, "loss": 0.0766, "step": 44140 }, { "epoch": 1.11, "learning_rate": 0.0013361806898977463, "loss": 0.078, "step": 44150 }, { "epoch": 1.11, "learning_rate": 0.0013358038338818683, "loss": 0.0766, "step": 44160 }, { "epoch": 1.11, "learning_rate": 0.00133542697786599, "loss": 0.0778, "step": 44170 }, { "epoch": 1.11, "learning_rate": 0.001335050121850112, "loss": 0.0754, "step": 44180 }, { "epoch": 1.11, "learning_rate": 0.0013346732658342335, "loss": 0.0758, "step": 44190 }, { "epoch": 1.11, "learning_rate": 0.0013342964098183555, "loss": 0.0773, "step": 44200 }, { "epoch": 1.11, "learning_rate": 0.0013339195538024772, "loss": 0.0765, "step": 44210 }, { "epoch": 1.11, "learning_rate": 0.0013335426977865992, "loss": 0.0818, "step": 44220 }, { "epoch": 1.11, "learning_rate": 0.0013331658417707207, "loss": 0.0779, "step": 44230 }, { "epoch": 1.11, "learning_rate": 0.0013327889857548427, "loss": 0.0762, "step": 44240 }, { "epoch": 1.11, "learning_rate": 0.0013324121297389644, "loss": 0.0821, "step": 44250 }, { "epoch": 1.11, "learning_rate": 0.0013320352737230864, "loss": 0.0795, "step": 44260 }, { "epoch": 1.11, "learning_rate": 0.0013316584177072081, "loss": 0.0778, "step": 44270 }, { "epoch": 1.11, "learning_rate": 0.0013312815616913296, "loss": 0.0735, "step": 44280 }, { "epoch": 1.11, "learning_rate": 0.0013309047056754516, "loss": 0.0784, "step": 44290 }, { "epoch": 1.11, "learning_rate": 0.0013305278496595734, "loss": 0.0766, "step": 44300 }, { "epoch": 1.11, "learning_rate": 0.0013301509936436953, "loss": 0.075, "step": 44310 }, { "epoch": 1.11, "learning_rate": 0.001329774137627817, "loss": 0.0754, "step": 44320 }, { "epoch": 1.11, "learning_rate": 0.0013293972816119388, "loss": 0.0773, "step": 44330 }, { "epoch": 1.11, "learning_rate": 0.0013290204255960605, "loss": 0.0754, "step": 44340 }, { "epoch": 1.11, "learning_rate": 0.0013286435695801825, "loss": 0.0759, "step": 44350 }, { "epoch": 1.11, "learning_rate": 0.0013282667135643043, "loss": 0.077, "step": 44360 }, { "epoch": 1.11, "learning_rate": 0.001327889857548426, "loss": 0.0807, "step": 44370 }, { "epoch": 1.11, "learning_rate": 0.0013275130015325477, "loss": 0.0761, "step": 44380 }, { "epoch": 1.12, "learning_rate": 0.0013271361455166697, "loss": 0.0758, "step": 44390 }, { "epoch": 1.12, "learning_rate": 0.0013267592895007914, "loss": 0.0725, "step": 44400 }, { "epoch": 1.12, "learning_rate": 0.0013263824334849132, "loss": 0.0731, "step": 44410 }, { "epoch": 1.12, "learning_rate": 0.001326005577469035, "loss": 0.0772, "step": 44420 }, { "epoch": 1.12, "learning_rate": 0.001325628721453157, "loss": 0.0792, "step": 44430 }, { "epoch": 1.12, "learning_rate": 0.0013252518654372786, "loss": 0.0747, "step": 44440 }, { "epoch": 1.12, "learning_rate": 0.0013248750094214004, "loss": 0.0769, "step": 44450 }, { "epoch": 1.12, "learning_rate": 0.0013244981534055221, "loss": 0.0736, "step": 44460 }, { "epoch": 1.12, "learning_rate": 0.001324121297389644, "loss": 0.074, "step": 44470 }, { "epoch": 1.12, "learning_rate": 0.0013237444413737658, "loss": 0.0762, "step": 44480 }, { "epoch": 1.12, "learning_rate": 0.0013233675853578878, "loss": 0.0791, "step": 44490 }, { "epoch": 1.12, "learning_rate": 0.0013229907293420093, "loss": 0.0758, "step": 44500 }, { "epoch": 1.12, "eval_cer": 0.6656565641982919, "eval_loss": 0.06587806344032288, "eval_runtime": 90.6347, "eval_samples_per_second": 110.322, "eval_steps_per_second": 6.896, "step": 44500 }, { "epoch": 1.12, "learning_rate": 0.001322613873326131, "loss": 0.0772, "step": 44510 }, { "epoch": 1.12, "learning_rate": 0.001322237017310253, "loss": 0.08, "step": 44520 }, { "epoch": 1.12, "learning_rate": 0.0013218601612943748, "loss": 0.075, "step": 44530 }, { "epoch": 1.12, "learning_rate": 0.0013214833052784967, "loss": 0.0768, "step": 44540 }, { "epoch": 1.12, "learning_rate": 0.0013211064492626183, "loss": 0.0809, "step": 44550 }, { "epoch": 1.12, "learning_rate": 0.0013207295932467402, "loss": 0.0782, "step": 44560 }, { "epoch": 1.12, "learning_rate": 0.001320352737230862, "loss": 0.0751, "step": 44570 }, { "epoch": 1.12, "learning_rate": 0.001319975881214984, "loss": 0.0754, "step": 44580 }, { "epoch": 1.12, "learning_rate": 0.0013195990251991057, "loss": 0.0765, "step": 44590 }, { "epoch": 1.12, "learning_rate": 0.0013192221691832274, "loss": 0.0775, "step": 44600 }, { "epoch": 1.12, "learning_rate": 0.0013188453131673492, "loss": 0.0762, "step": 44610 }, { "epoch": 1.12, "learning_rate": 0.0013184684571514711, "loss": 0.0778, "step": 44620 }, { "epoch": 1.12, "learning_rate": 0.0013180916011355929, "loss": 0.0807, "step": 44630 }, { "epoch": 1.12, "learning_rate": 0.0013177147451197146, "loss": 0.0805, "step": 44640 }, { "epoch": 1.12, "learning_rate": 0.0013173378891038364, "loss": 0.0761, "step": 44650 }, { "epoch": 1.12, "learning_rate": 0.0013169610330879583, "loss": 0.0762, "step": 44660 }, { "epoch": 1.12, "learning_rate": 0.00131658417707208, "loss": 0.0786, "step": 44670 }, { "epoch": 1.12, "learning_rate": 0.0013162073210562018, "loss": 0.0774, "step": 44680 }, { "epoch": 1.12, "learning_rate": 0.0013158304650403236, "loss": 0.0764, "step": 44690 }, { "epoch": 1.12, "learning_rate": 0.0013154536090244455, "loss": 0.0752, "step": 44700 }, { "epoch": 1.12, "learning_rate": 0.0013150767530085673, "loss": 0.0791, "step": 44710 }, { "epoch": 1.12, "learning_rate": 0.001314699896992689, "loss": 0.077, "step": 44720 }, { "epoch": 1.12, "learning_rate": 0.0013143230409768108, "loss": 0.0777, "step": 44730 }, { "epoch": 1.12, "learning_rate": 0.0013139461849609325, "loss": 0.0777, "step": 44740 }, { "epoch": 1.12, "learning_rate": 0.0013135693289450545, "loss": 0.0753, "step": 44750 }, { "epoch": 1.12, "learning_rate": 0.0013131924729291762, "loss": 0.0751, "step": 44760 }, { "epoch": 1.12, "learning_rate": 0.001312815616913298, "loss": 0.078, "step": 44770 }, { "epoch": 1.13, "learning_rate": 0.0013124387608974197, "loss": 0.0778, "step": 44780 }, { "epoch": 1.13, "learning_rate": 0.0013120619048815417, "loss": 0.0753, "step": 44790 }, { "epoch": 1.13, "learning_rate": 0.0013116850488656634, "loss": 0.0761, "step": 44800 }, { "epoch": 1.13, "learning_rate": 0.0013113081928497851, "loss": 0.0741, "step": 44810 }, { "epoch": 1.13, "learning_rate": 0.001310931336833907, "loss": 0.0784, "step": 44820 }, { "epoch": 1.13, "learning_rate": 0.0013105544808180289, "loss": 0.0736, "step": 44830 }, { "epoch": 1.13, "learning_rate": 0.0013101776248021506, "loss": 0.0766, "step": 44840 }, { "epoch": 1.13, "learning_rate": 0.0013098007687862726, "loss": 0.0757, "step": 44850 }, { "epoch": 1.13, "learning_rate": 0.001309423912770394, "loss": 0.0776, "step": 44860 }, { "epoch": 1.13, "learning_rate": 0.001309047056754516, "loss": 0.078, "step": 44870 }, { "epoch": 1.13, "learning_rate": 0.0013086702007386378, "loss": 0.0772, "step": 44880 }, { "epoch": 1.13, "learning_rate": 0.0013082933447227598, "loss": 0.0765, "step": 44890 }, { "epoch": 1.13, "learning_rate": 0.0013079164887068815, "loss": 0.0778, "step": 44900 }, { "epoch": 1.13, "learning_rate": 0.0013075396326910032, "loss": 0.0754, "step": 44910 }, { "epoch": 1.13, "learning_rate": 0.001307162776675125, "loss": 0.0739, "step": 44920 }, { "epoch": 1.13, "learning_rate": 0.001306785920659247, "loss": 0.0745, "step": 44930 }, { "epoch": 1.13, "learning_rate": 0.0013064090646433687, "loss": 0.0804, "step": 44940 }, { "epoch": 1.13, "learning_rate": 0.0013060322086274904, "loss": 0.0756, "step": 44950 }, { "epoch": 1.13, "learning_rate": 0.0013056553526116122, "loss": 0.0743, "step": 44960 }, { "epoch": 1.13, "learning_rate": 0.001305278496595734, "loss": 0.0764, "step": 44970 }, { "epoch": 1.13, "learning_rate": 0.0013049016405798559, "loss": 0.0746, "step": 44980 }, { "epoch": 1.13, "learning_rate": 0.0013045247845639776, "loss": 0.073, "step": 44990 }, { "epoch": 1.13, "learning_rate": 0.0013041479285480994, "loss": 0.0767, "step": 45000 }, { "epoch": 1.13, "eval_cer": 0.6657903462307875, "eval_loss": 0.06532227247953415, "eval_runtime": 90.6615, "eval_samples_per_second": 110.289, "eval_steps_per_second": 6.894, "step": 45000 }, { "epoch": 1.13, "learning_rate": 0.0013037710725322211, "loss": 0.0783, "step": 45010 }, { "epoch": 1.13, "learning_rate": 0.001303394216516343, "loss": 0.075, "step": 45020 }, { "epoch": 1.13, "learning_rate": 0.0013030173605004648, "loss": 0.0787, "step": 45030 }, { "epoch": 1.13, "learning_rate": 0.0013026405044845866, "loss": 0.078, "step": 45040 }, { "epoch": 1.13, "learning_rate": 0.0013022636484687083, "loss": 0.0798, "step": 45050 }, { "epoch": 1.13, "learning_rate": 0.0013018867924528303, "loss": 0.0757, "step": 45060 }, { "epoch": 1.13, "learning_rate": 0.001301509936436952, "loss": 0.0786, "step": 45070 }, { "epoch": 1.13, "learning_rate": 0.0013011330804210738, "loss": 0.0777, "step": 45080 }, { "epoch": 1.13, "learning_rate": 0.0013007562244051955, "loss": 0.0785, "step": 45090 }, { "epoch": 1.13, "learning_rate": 0.0013003793683893175, "loss": 0.0769, "step": 45100 }, { "epoch": 1.13, "learning_rate": 0.0013000025123734392, "loss": 0.0773, "step": 45110 }, { "epoch": 1.13, "learning_rate": 0.0012996256563575612, "loss": 0.0759, "step": 45120 }, { "epoch": 1.13, "learning_rate": 0.0012992488003416827, "loss": 0.0736, "step": 45130 }, { "epoch": 1.13, "learning_rate": 0.0012988719443258047, "loss": 0.0748, "step": 45140 }, { "epoch": 1.13, "learning_rate": 0.0012984950883099264, "loss": 0.0784, "step": 45150 }, { "epoch": 1.13, "learning_rate": 0.0012981182322940484, "loss": 0.0771, "step": 45160 }, { "epoch": 1.13, "learning_rate": 0.0012977413762781701, "loss": 0.0777, "step": 45170 }, { "epoch": 1.14, "learning_rate": 0.0012973645202622917, "loss": 0.0752, "step": 45180 }, { "epoch": 1.14, "learning_rate": 0.0012969876642464136, "loss": 0.0799, "step": 45190 }, { "epoch": 1.14, "learning_rate": 0.0012966108082305354, "loss": 0.0744, "step": 45200 }, { "epoch": 1.14, "learning_rate": 0.0012962339522146573, "loss": 0.0783, "step": 45210 }, { "epoch": 1.14, "learning_rate": 0.0012958570961987788, "loss": 0.0738, "step": 45220 }, { "epoch": 1.14, "learning_rate": 0.0012954802401829008, "loss": 0.0774, "step": 45230 }, { "epoch": 1.14, "learning_rate": 0.0012951033841670226, "loss": 0.0768, "step": 45240 }, { "epoch": 1.14, "learning_rate": 0.0012947265281511445, "loss": 0.0775, "step": 45250 }, { "epoch": 1.14, "learning_rate": 0.0012943496721352663, "loss": 0.0775, "step": 45260 }, { "epoch": 1.14, "learning_rate": 0.001293972816119388, "loss": 0.0772, "step": 45270 }, { "epoch": 1.14, "learning_rate": 0.0012935959601035097, "loss": 0.0772, "step": 45280 }, { "epoch": 1.14, "learning_rate": 0.0012932191040876317, "loss": 0.0748, "step": 45290 }, { "epoch": 1.14, "learning_rate": 0.0012928422480717535, "loss": 0.0769, "step": 45300 }, { "epoch": 1.14, "learning_rate": 0.0012924653920558752, "loss": 0.0765, "step": 45310 }, { "epoch": 1.14, "learning_rate": 0.001292088536039997, "loss": 0.0774, "step": 45320 }, { "epoch": 1.14, "learning_rate": 0.001291711680024119, "loss": 0.0758, "step": 45330 }, { "epoch": 1.14, "learning_rate": 0.0012913348240082406, "loss": 0.0754, "step": 45340 }, { "epoch": 1.14, "learning_rate": 0.0012909579679923624, "loss": 0.0751, "step": 45350 }, { "epoch": 1.14, "learning_rate": 0.0012905811119764841, "loss": 0.0809, "step": 45360 }, { "epoch": 1.14, "learning_rate": 0.001290204255960606, "loss": 0.0726, "step": 45370 }, { "epoch": 1.14, "learning_rate": 0.0012898273999447278, "loss": 0.0749, "step": 45380 }, { "epoch": 1.14, "learning_rate": 0.0012894505439288496, "loss": 0.0784, "step": 45390 }, { "epoch": 1.14, "learning_rate": 0.0012890736879129713, "loss": 0.0771, "step": 45400 }, { "epoch": 1.14, "learning_rate": 0.001288696831897093, "loss": 0.0773, "step": 45410 }, { "epoch": 1.14, "learning_rate": 0.001288319975881215, "loss": 0.0773, "step": 45420 }, { "epoch": 1.14, "learning_rate": 0.0012879431198653368, "loss": 0.0764, "step": 45430 }, { "epoch": 1.14, "learning_rate": 0.0012875662638494585, "loss": 0.0747, "step": 45440 }, { "epoch": 1.14, "learning_rate": 0.0012871894078335803, "loss": 0.0773, "step": 45450 }, { "epoch": 1.14, "learning_rate": 0.0012868125518177022, "loss": 0.0784, "step": 45460 }, { "epoch": 1.14, "learning_rate": 0.001286435695801824, "loss": 0.0732, "step": 45470 }, { "epoch": 1.14, "learning_rate": 0.001286058839785946, "loss": 0.0737, "step": 45480 }, { "epoch": 1.14, "learning_rate": 0.0012856819837700675, "loss": 0.0778, "step": 45490 }, { "epoch": 1.14, "learning_rate": 0.0012853051277541894, "loss": 0.076, "step": 45500 }, { "epoch": 1.14, "eval_cer": 0.6656166220806763, "eval_loss": 0.06491339206695557, "eval_runtime": 90.6455, "eval_samples_per_second": 110.309, "eval_steps_per_second": 6.895, "step": 45500 }, { "epoch": 1.14, "learning_rate": 0.0012849282717383112, "loss": 0.0753, "step": 45510 }, { "epoch": 1.14, "learning_rate": 0.0012845514157224331, "loss": 0.0766, "step": 45520 }, { "epoch": 1.14, "learning_rate": 0.0012841745597065549, "loss": 0.0741, "step": 45530 }, { "epoch": 1.14, "learning_rate": 0.0012837977036906766, "loss": 0.077, "step": 45540 }, { "epoch": 1.14, "learning_rate": 0.0012834208476747984, "loss": 0.0744, "step": 45550 }, { "epoch": 1.14, "learning_rate": 0.0012830439916589203, "loss": 0.079, "step": 45560 }, { "epoch": 1.14, "learning_rate": 0.001282667135643042, "loss": 0.0796, "step": 45570 }, { "epoch": 1.15, "learning_rate": 0.0012822902796271638, "loss": 0.0769, "step": 45580 }, { "epoch": 1.15, "learning_rate": 0.0012819134236112856, "loss": 0.0753, "step": 45590 }, { "epoch": 1.15, "learning_rate": 0.0012815365675954075, "loss": 0.0754, "step": 45600 }, { "epoch": 1.15, "learning_rate": 0.0012811597115795293, "loss": 0.0769, "step": 45610 }, { "epoch": 1.15, "learning_rate": 0.001280782855563651, "loss": 0.0733, "step": 45620 }, { "epoch": 1.15, "learning_rate": 0.0012804059995477728, "loss": 0.0752, "step": 45630 }, { "epoch": 1.15, "learning_rate": 0.0012800291435318945, "loss": 0.0773, "step": 45640 }, { "epoch": 1.15, "learning_rate": 0.0012796522875160165, "loss": 0.0754, "step": 45650 }, { "epoch": 1.15, "learning_rate": 0.0012792754315001382, "loss": 0.08, "step": 45660 }, { "epoch": 1.15, "learning_rate": 0.00127889857548426, "loss": 0.0804, "step": 45670 }, { "epoch": 1.15, "learning_rate": 0.0012785217194683817, "loss": 0.0743, "step": 45680 }, { "epoch": 1.15, "learning_rate": 0.0012781448634525037, "loss": 0.0785, "step": 45690 }, { "epoch": 1.15, "learning_rate": 0.0012777680074366254, "loss": 0.0746, "step": 45700 }, { "epoch": 1.15, "learning_rate": 0.0012773911514207472, "loss": 0.0781, "step": 45710 }, { "epoch": 1.15, "learning_rate": 0.001277014295404869, "loss": 0.0751, "step": 45720 }, { "epoch": 1.15, "learning_rate": 0.0012766374393889909, "loss": 0.0732, "step": 45730 }, { "epoch": 1.15, "learning_rate": 0.0012762605833731126, "loss": 0.078, "step": 45740 }, { "epoch": 1.15, "learning_rate": 0.0012758837273572346, "loss": 0.0755, "step": 45750 }, { "epoch": 1.15, "learning_rate": 0.001275506871341356, "loss": 0.0738, "step": 45760 }, { "epoch": 1.15, "learning_rate": 0.001275130015325478, "loss": 0.0758, "step": 45770 }, { "epoch": 1.15, "learning_rate": 0.0012747531593095998, "loss": 0.0788, "step": 45780 }, { "epoch": 1.15, "learning_rate": 0.0012743763032937218, "loss": 0.0747, "step": 45790 }, { "epoch": 1.15, "learning_rate": 0.0012739994472778433, "loss": 0.0738, "step": 45800 }, { "epoch": 1.15, "learning_rate": 0.0012736225912619652, "loss": 0.0766, "step": 45810 }, { "epoch": 1.15, "learning_rate": 0.001273245735246087, "loss": 0.0775, "step": 45820 }, { "epoch": 1.15, "learning_rate": 0.001272868879230209, "loss": 0.0764, "step": 45830 }, { "epoch": 1.15, "learning_rate": 0.0012724920232143307, "loss": 0.0763, "step": 45840 }, { "epoch": 1.15, "learning_rate": 0.0012721151671984522, "loss": 0.0764, "step": 45850 }, { "epoch": 1.15, "learning_rate": 0.0012717383111825742, "loss": 0.0783, "step": 45860 }, { "epoch": 1.15, "learning_rate": 0.001271361455166696, "loss": 0.0761, "step": 45870 }, { "epoch": 1.15, "learning_rate": 0.001270984599150818, "loss": 0.0754, "step": 45880 }, { "epoch": 1.15, "learning_rate": 0.0012706077431349396, "loss": 0.0747, "step": 45890 }, { "epoch": 1.15, "learning_rate": 0.0012702308871190614, "loss": 0.0734, "step": 45900 }, { "epoch": 1.15, "learning_rate": 0.0012698540311031831, "loss": 0.0731, "step": 45910 }, { "epoch": 1.15, "learning_rate": 0.001269477175087305, "loss": 0.0764, "step": 45920 }, { "epoch": 1.15, "learning_rate": 0.0012691003190714268, "loss": 0.0768, "step": 45930 }, { "epoch": 1.15, "learning_rate": 0.0012687234630555486, "loss": 0.0753, "step": 45940 }, { "epoch": 1.15, "learning_rate": 0.0012683466070396703, "loss": 0.077, "step": 45950 }, { "epoch": 1.15, "learning_rate": 0.0012679697510237923, "loss": 0.0747, "step": 45960 }, { "epoch": 1.15, "learning_rate": 0.001267592895007914, "loss": 0.0733, "step": 45970 }, { "epoch": 1.16, "learning_rate": 0.0012672160389920358, "loss": 0.0791, "step": 45980 }, { "epoch": 1.16, "learning_rate": 0.0012668391829761575, "loss": 0.0772, "step": 45990 }, { "epoch": 1.16, "learning_rate": 0.0012664623269602795, "loss": 0.0727, "step": 46000 }, { "epoch": 1.16, "eval_cer": 0.6655747550417299, "eval_loss": 0.06513096392154694, "eval_runtime": 90.5203, "eval_samples_per_second": 110.461, "eval_steps_per_second": 6.905, "step": 46000 }, { "epoch": 1.16, "learning_rate": 0.0012660854709444012, "loss": 0.0725, "step": 46010 }, { "epoch": 1.16, "learning_rate": 0.001265708614928523, "loss": 0.0729, "step": 46020 }, { "epoch": 1.16, "learning_rate": 0.0012653317589126447, "loss": 0.0771, "step": 46030 }, { "epoch": 1.16, "learning_rate": 0.0012649549028967667, "loss": 0.0748, "step": 46040 }, { "epoch": 1.16, "learning_rate": 0.0012645780468808884, "loss": 0.0758, "step": 46050 }, { "epoch": 1.16, "learning_rate": 0.0012642011908650102, "loss": 0.0764, "step": 46060 }, { "epoch": 1.16, "learning_rate": 0.001263824334849132, "loss": 0.0768, "step": 46070 }, { "epoch": 1.16, "learning_rate": 0.0012634474788332537, "loss": 0.074, "step": 46080 }, { "epoch": 1.16, "learning_rate": 0.0012630706228173756, "loss": 0.0755, "step": 46090 }, { "epoch": 1.16, "learning_rate": 0.0012626937668014974, "loss": 0.0783, "step": 46100 }, { "epoch": 1.16, "learning_rate": 0.0012623169107856193, "loss": 0.0742, "step": 46110 }, { "epoch": 1.16, "learning_rate": 0.0012619400547697408, "loss": 0.0756, "step": 46120 }, { "epoch": 1.16, "learning_rate": 0.0012615631987538628, "loss": 0.0765, "step": 46130 }, { "epoch": 1.16, "learning_rate": 0.0012611863427379846, "loss": 0.0752, "step": 46140 }, { "epoch": 1.16, "learning_rate": 0.0012608094867221065, "loss": 0.077, "step": 46150 }, { "epoch": 1.16, "learning_rate": 0.0012604326307062283, "loss": 0.0764, "step": 46160 }, { "epoch": 1.16, "learning_rate": 0.00126005577469035, "loss": 0.0756, "step": 46170 }, { "epoch": 1.16, "learning_rate": 0.0012596789186744718, "loss": 0.0721, "step": 46180 }, { "epoch": 1.16, "learning_rate": 0.0012593020626585937, "loss": 0.0757, "step": 46190 }, { "epoch": 1.16, "learning_rate": 0.0012589252066427155, "loss": 0.0774, "step": 46200 }, { "epoch": 1.16, "learning_rate": 0.0012585483506268372, "loss": 0.078, "step": 46210 }, { "epoch": 1.16, "learning_rate": 0.001258171494610959, "loss": 0.0778, "step": 46220 }, { "epoch": 1.16, "learning_rate": 0.001257794638595081, "loss": 0.0741, "step": 46230 }, { "epoch": 1.16, "learning_rate": 0.0012574177825792027, "loss": 0.0783, "step": 46240 }, { "epoch": 1.16, "learning_rate": 0.0012570409265633244, "loss": 0.0737, "step": 46250 }, { "epoch": 1.16, "learning_rate": 0.0012566640705474461, "loss": 0.0769, "step": 46260 }, { "epoch": 1.16, "learning_rate": 0.001256287214531568, "loss": 0.076, "step": 46270 }, { "epoch": 1.16, "learning_rate": 0.0012559103585156898, "loss": 0.0752, "step": 46280 }, { "epoch": 1.16, "learning_rate": 0.0012555335024998116, "loss": 0.0792, "step": 46290 }, { "epoch": 1.16, "learning_rate": 0.0012551566464839333, "loss": 0.0733, "step": 46300 }, { "epoch": 1.16, "learning_rate": 0.001254779790468055, "loss": 0.0786, "step": 46310 }, { "epoch": 1.16, "learning_rate": 0.001254402934452177, "loss": 0.0757, "step": 46320 }, { "epoch": 1.16, "learning_rate": 0.0012540260784362988, "loss": 0.0768, "step": 46330 }, { "epoch": 1.16, "learning_rate": 0.0012536492224204205, "loss": 0.0742, "step": 46340 }, { "epoch": 1.16, "learning_rate": 0.0012532723664045423, "loss": 0.0765, "step": 46350 }, { "epoch": 1.16, "learning_rate": 0.0012528955103886642, "loss": 0.0782, "step": 46360 }, { "epoch": 1.16, "learning_rate": 0.001252518654372786, "loss": 0.0715, "step": 46370 }, { "epoch": 1.17, "learning_rate": 0.0012521417983569077, "loss": 0.074, "step": 46380 }, { "epoch": 1.17, "learning_rate": 0.0012517649423410295, "loss": 0.0776, "step": 46390 }, { "epoch": 1.17, "learning_rate": 0.0012513880863251514, "loss": 0.0741, "step": 46400 }, { "epoch": 1.17, "learning_rate": 0.0012510112303092732, "loss": 0.076, "step": 46410 }, { "epoch": 1.17, "learning_rate": 0.0012506343742933951, "loss": 0.0759, "step": 46420 }, { "epoch": 1.17, "learning_rate": 0.0012502575182775167, "loss": 0.0745, "step": 46430 }, { "epoch": 1.17, "learning_rate": 0.0012498806622616386, "loss": 0.0732, "step": 46440 }, { "epoch": 1.17, "learning_rate": 0.0012495038062457604, "loss": 0.0764, "step": 46450 }, { "epoch": 1.17, "learning_rate": 0.0012491269502298823, "loss": 0.0717, "step": 46460 }, { "epoch": 1.17, "learning_rate": 0.001248750094214004, "loss": 0.0757, "step": 46470 }, { "epoch": 1.17, "learning_rate": 0.0012483732381981258, "loss": 0.0775, "step": 46480 }, { "epoch": 1.17, "learning_rate": 0.0012479963821822476, "loss": 0.0779, "step": 46490 }, { "epoch": 1.17, "learning_rate": 0.0012476195261663693, "loss": 0.0768, "step": 46500 }, { "epoch": 1.17, "eval_cer": 0.6655930417943732, "eval_loss": 0.06406976282596588, "eval_runtime": 90.5517, "eval_samples_per_second": 110.423, "eval_steps_per_second": 6.902, "step": 46500 }, { "epoch": 1.17, "learning_rate": 0.0012472426701504913, "loss": 0.0776, "step": 46510 }, { "epoch": 1.17, "learning_rate": 0.001246865814134613, "loss": 0.0767, "step": 46520 }, { "epoch": 1.17, "learning_rate": 0.0012464889581187348, "loss": 0.0754, "step": 46530 }, { "epoch": 1.17, "learning_rate": 0.0012461121021028565, "loss": 0.0757, "step": 46540 }, { "epoch": 1.17, "learning_rate": 0.0012457352460869785, "loss": 0.0754, "step": 46550 }, { "epoch": 1.17, "learning_rate": 0.0012453583900711002, "loss": 0.0723, "step": 46560 }, { "epoch": 1.17, "learning_rate": 0.001244981534055222, "loss": 0.0809, "step": 46570 }, { "epoch": 1.17, "learning_rate": 0.0012446046780393437, "loss": 0.0741, "step": 46580 }, { "epoch": 1.17, "learning_rate": 0.0012442278220234657, "loss": 0.0764, "step": 46590 }, { "epoch": 1.17, "learning_rate": 0.0012438509660075874, "loss": 0.0733, "step": 46600 }, { "epoch": 1.17, "learning_rate": 0.0012434741099917092, "loss": 0.0768, "step": 46610 }, { "epoch": 1.17, "learning_rate": 0.001243097253975831, "loss": 0.077, "step": 46620 }, { "epoch": 1.17, "learning_rate": 0.0012427203979599529, "loss": 0.0778, "step": 46630 }, { "epoch": 1.17, "learning_rate": 0.0012423435419440746, "loss": 0.0734, "step": 46640 }, { "epoch": 1.17, "learning_rate": 0.0012419666859281964, "loss": 0.08, "step": 46650 }, { "epoch": 1.17, "learning_rate": 0.001241589829912318, "loss": 0.0748, "step": 46660 }, { "epoch": 1.17, "learning_rate": 0.00124121297389644, "loss": 0.0786, "step": 46670 }, { "epoch": 1.17, "learning_rate": 0.0012408361178805618, "loss": 0.075, "step": 46680 }, { "epoch": 1.17, "learning_rate": 0.0012404592618646838, "loss": 0.0733, "step": 46690 }, { "epoch": 1.17, "learning_rate": 0.0012400824058488053, "loss": 0.0762, "step": 46700 }, { "epoch": 1.17, "learning_rate": 0.0012397055498329273, "loss": 0.0772, "step": 46710 }, { "epoch": 1.17, "learning_rate": 0.001239328693817049, "loss": 0.075, "step": 46720 }, { "epoch": 1.17, "learning_rate": 0.0012389518378011707, "loss": 0.0785, "step": 46730 }, { "epoch": 1.17, "learning_rate": 0.0012385749817852927, "loss": 0.0727, "step": 46740 }, { "epoch": 1.17, "learning_rate": 0.0012381981257694142, "loss": 0.0744, "step": 46750 }, { "epoch": 1.17, "learning_rate": 0.0012378212697535362, "loss": 0.0724, "step": 46760 }, { "epoch": 1.18, "learning_rate": 0.001237444413737658, "loss": 0.0806, "step": 46770 }, { "epoch": 1.18, "learning_rate": 0.00123706755772178, "loss": 0.0719, "step": 46780 }, { "epoch": 1.18, "learning_rate": 0.0012366907017059014, "loss": 0.0752, "step": 46790 }, { "epoch": 1.18, "learning_rate": 0.0012363138456900234, "loss": 0.0737, "step": 46800 }, { "epoch": 1.18, "learning_rate": 0.0012359369896741451, "loss": 0.0777, "step": 46810 }, { "epoch": 1.18, "learning_rate": 0.001235560133658267, "loss": 0.0728, "step": 46820 }, { "epoch": 1.18, "learning_rate": 0.0012351832776423888, "loss": 0.0768, "step": 46830 }, { "epoch": 1.18, "learning_rate": 0.0012348064216265106, "loss": 0.0739, "step": 46840 }, { "epoch": 1.18, "learning_rate": 0.0012344295656106323, "loss": 0.0794, "step": 46850 }, { "epoch": 1.18, "learning_rate": 0.0012340527095947543, "loss": 0.075, "step": 46860 }, { "epoch": 1.18, "learning_rate": 0.001233675853578876, "loss": 0.0712, "step": 46870 }, { "epoch": 1.18, "learning_rate": 0.0012332989975629978, "loss": 0.072, "step": 46880 }, { "epoch": 1.18, "learning_rate": 0.0012329221415471195, "loss": 0.0762, "step": 46890 }, { "epoch": 1.18, "learning_rate": 0.0012325452855312415, "loss": 0.0749, "step": 46900 }, { "epoch": 1.18, "learning_rate": 0.0012321684295153632, "loss": 0.0781, "step": 46910 }, { "epoch": 1.18, "learning_rate": 0.001231791573499485, "loss": 0.0743, "step": 46920 }, { "epoch": 1.18, "learning_rate": 0.0012314147174836067, "loss": 0.0784, "step": 46930 }, { "epoch": 1.18, "learning_rate": 0.0012310378614677287, "loss": 0.0747, "step": 46940 }, { "epoch": 1.18, "learning_rate": 0.0012306610054518504, "loss": 0.0766, "step": 46950 }, { "epoch": 1.18, "learning_rate": 0.0012302841494359722, "loss": 0.0786, "step": 46960 }, { "epoch": 1.18, "learning_rate": 0.001229907293420094, "loss": 0.0787, "step": 46970 }, { "epoch": 1.18, "learning_rate": 0.0012295304374042157, "loss": 0.0791, "step": 46980 }, { "epoch": 1.18, "learning_rate": 0.0012291535813883376, "loss": 0.0738, "step": 46990 }, { "epoch": 1.18, "learning_rate": 0.0012287767253724594, "loss": 0.0722, "step": 47000 }, { "epoch": 1.18, "eval_cer": 0.665535294154447, "eval_loss": 0.06398055702447891, "eval_runtime": 90.575, "eval_samples_per_second": 110.395, "eval_steps_per_second": 6.9, "step": 47000 }, { "epoch": 1.18, "learning_rate": 0.0012283998693565811, "loss": 0.0727, "step": 47010 }, { "epoch": 1.18, "learning_rate": 0.0012280230133407029, "loss": 0.0755, "step": 47020 }, { "epoch": 1.18, "learning_rate": 0.0012276461573248248, "loss": 0.0754, "step": 47030 }, { "epoch": 1.18, "learning_rate": 0.0012272693013089466, "loss": 0.0733, "step": 47040 }, { "epoch": 1.18, "learning_rate": 0.0012268924452930685, "loss": 0.0773, "step": 47050 }, { "epoch": 1.18, "learning_rate": 0.00122651558927719, "loss": 0.0756, "step": 47060 }, { "epoch": 1.18, "learning_rate": 0.001226138733261312, "loss": 0.0774, "step": 47070 }, { "epoch": 1.18, "learning_rate": 0.0012257618772454338, "loss": 0.0743, "step": 47080 }, { "epoch": 1.18, "learning_rate": 0.0012253850212295557, "loss": 0.0749, "step": 47090 }, { "epoch": 1.18, "learning_rate": 0.0012250081652136775, "loss": 0.0756, "step": 47100 }, { "epoch": 1.18, "learning_rate": 0.0012246313091977992, "loss": 0.0776, "step": 47110 }, { "epoch": 1.18, "learning_rate": 0.001224254453181921, "loss": 0.076, "step": 47120 }, { "epoch": 1.18, "learning_rate": 0.001223877597166043, "loss": 0.0736, "step": 47130 }, { "epoch": 1.18, "learning_rate": 0.0012235007411501647, "loss": 0.0775, "step": 47140 }, { "epoch": 1.18, "learning_rate": 0.0012231238851342864, "loss": 0.0731, "step": 47150 }, { "epoch": 1.18, "learning_rate": 0.0012227470291184081, "loss": 0.0761, "step": 47160 }, { "epoch": 1.19, "learning_rate": 0.0012223701731025299, "loss": 0.076, "step": 47170 }, { "epoch": 1.19, "learning_rate": 0.0012219933170866519, "loss": 0.0743, "step": 47180 }, { "epoch": 1.19, "learning_rate": 0.0012216164610707736, "loss": 0.0743, "step": 47190 }, { "epoch": 1.19, "learning_rate": 0.0012212396050548953, "loss": 0.0728, "step": 47200 }, { "epoch": 1.19, "learning_rate": 0.001220862749039017, "loss": 0.0735, "step": 47210 }, { "epoch": 1.19, "learning_rate": 0.001220485893023139, "loss": 0.0717, "step": 47220 }, { "epoch": 1.19, "learning_rate": 0.0012201090370072608, "loss": 0.0785, "step": 47230 }, { "epoch": 1.19, "learning_rate": 0.0012197321809913825, "loss": 0.0783, "step": 47240 }, { "epoch": 1.19, "learning_rate": 0.0012193553249755043, "loss": 0.0704, "step": 47250 }, { "epoch": 1.19, "learning_rate": 0.0012189784689596262, "loss": 0.0791, "step": 47260 }, { "epoch": 1.19, "learning_rate": 0.001218601612943748, "loss": 0.074, "step": 47270 }, { "epoch": 1.19, "learning_rate": 0.0012182247569278697, "loss": 0.0769, "step": 47280 }, { "epoch": 1.19, "learning_rate": 0.0012178479009119915, "loss": 0.0742, "step": 47290 }, { "epoch": 1.19, "learning_rate": 0.0012174710448961134, "loss": 0.0785, "step": 47300 }, { "epoch": 1.19, "learning_rate": 0.0012170941888802352, "loss": 0.0742, "step": 47310 }, { "epoch": 1.19, "learning_rate": 0.0012167173328643571, "loss": 0.0744, "step": 47320 }, { "epoch": 1.19, "learning_rate": 0.0012163404768484787, "loss": 0.0743, "step": 47330 }, { "epoch": 1.19, "learning_rate": 0.0012159636208326006, "loss": 0.0762, "step": 47340 }, { "epoch": 1.19, "learning_rate": 0.0012155867648167224, "loss": 0.0755, "step": 47350 }, { "epoch": 1.19, "learning_rate": 0.0012152099088008443, "loss": 0.0765, "step": 47360 }, { "epoch": 1.19, "learning_rate": 0.001214833052784966, "loss": 0.0749, "step": 47370 }, { "epoch": 1.19, "learning_rate": 0.0012144561967690878, "loss": 0.0751, "step": 47380 }, { "epoch": 1.19, "learning_rate": 0.0012140793407532096, "loss": 0.0754, "step": 47390 }, { "epoch": 1.19, "learning_rate": 0.0012137024847373313, "loss": 0.0717, "step": 47400 }, { "epoch": 1.19, "learning_rate": 0.0012133256287214533, "loss": 0.0781, "step": 47410 }, { "epoch": 1.19, "learning_rate": 0.0012129487727055748, "loss": 0.077, "step": 47420 }, { "epoch": 1.19, "learning_rate": 0.0012125719166896968, "loss": 0.0773, "step": 47430 }, { "epoch": 1.19, "learning_rate": 0.0012121950606738185, "loss": 0.0764, "step": 47440 }, { "epoch": 1.19, "learning_rate": 0.0012118182046579405, "loss": 0.0756, "step": 47450 }, { "epoch": 1.19, "learning_rate": 0.0012114413486420622, "loss": 0.0723, "step": 47460 }, { "epoch": 1.19, "learning_rate": 0.001211064492626184, "loss": 0.0778, "step": 47470 }, { "epoch": 1.19, "learning_rate": 0.0012106876366103057, "loss": 0.0765, "step": 47480 }, { "epoch": 1.19, "learning_rate": 0.0012103107805944277, "loss": 0.0763, "step": 47490 }, { "epoch": 1.19, "learning_rate": 0.0012099339245785494, "loss": 0.0763, "step": 47500 }, { "epoch": 1.19, "eval_cer": 0.6654433791608979, "eval_loss": 0.06456325203180313, "eval_runtime": 90.7603, "eval_samples_per_second": 110.169, "eval_steps_per_second": 6.886, "step": 47500 }, { "epoch": 1.19, "learning_rate": 0.0012095570685626712, "loss": 0.0749, "step": 47510 }, { "epoch": 1.19, "learning_rate": 0.001209180212546793, "loss": 0.0746, "step": 47520 }, { "epoch": 1.19, "learning_rate": 0.0012088033565309149, "loss": 0.0762, "step": 47530 }, { "epoch": 1.19, "learning_rate": 0.0012084265005150366, "loss": 0.0732, "step": 47540 }, { "epoch": 1.19, "learning_rate": 0.0012080496444991584, "loss": 0.079, "step": 47550 }, { "epoch": 1.19, "learning_rate": 0.00120767278848328, "loss": 0.0731, "step": 47560 }, { "epoch": 1.2, "learning_rate": 0.001207295932467402, "loss": 0.0733, "step": 47570 }, { "epoch": 1.2, "learning_rate": 0.0012069190764515238, "loss": 0.0763, "step": 47580 }, { "epoch": 1.2, "learning_rate": 0.0012065422204356455, "loss": 0.0736, "step": 47590 }, { "epoch": 1.2, "learning_rate": 0.0012061653644197673, "loss": 0.0765, "step": 47600 }, { "epoch": 1.2, "learning_rate": 0.0012057885084038893, "loss": 0.0718, "step": 47610 }, { "epoch": 1.2, "learning_rate": 0.001205411652388011, "loss": 0.0769, "step": 47620 }, { "epoch": 1.2, "learning_rate": 0.0012050347963721327, "loss": 0.0729, "step": 47630 }, { "epoch": 1.2, "learning_rate": 0.0012046579403562545, "loss": 0.0775, "step": 47640 }, { "epoch": 1.2, "learning_rate": 0.0012042810843403762, "loss": 0.0743, "step": 47650 }, { "epoch": 1.2, "learning_rate": 0.0012039042283244982, "loss": 0.0771, "step": 47660 }, { "epoch": 1.2, "learning_rate": 0.00120352737230862, "loss": 0.0741, "step": 47670 }, { "epoch": 1.2, "learning_rate": 0.001203150516292742, "loss": 0.0712, "step": 47680 }, { "epoch": 1.2, "learning_rate": 0.0012027736602768634, "loss": 0.0784, "step": 47690 }, { "epoch": 1.2, "learning_rate": 0.0012023968042609854, "loss": 0.0789, "step": 47700 }, { "epoch": 1.2, "learning_rate": 0.0012020199482451071, "loss": 0.0745, "step": 47710 }, { "epoch": 1.2, "learning_rate": 0.001201643092229229, "loss": 0.0761, "step": 47720 }, { "epoch": 1.2, "learning_rate": 0.0012012662362133508, "loss": 0.0758, "step": 47730 }, { "epoch": 1.2, "learning_rate": 0.0012008893801974726, "loss": 0.0718, "step": 47740 }, { "epoch": 1.2, "learning_rate": 0.0012005125241815943, "loss": 0.0712, "step": 47750 }, { "epoch": 1.2, "learning_rate": 0.0012001356681657163, "loss": 0.0782, "step": 47760 }, { "epoch": 1.2, "learning_rate": 0.001199758812149838, "loss": 0.0786, "step": 47770 }, { "epoch": 1.2, "learning_rate": 0.0011993819561339598, "loss": 0.0755, "step": 47780 }, { "epoch": 1.2, "learning_rate": 0.0011990051001180815, "loss": 0.0767, "step": 47790 }, { "epoch": 1.2, "learning_rate": 0.0011986282441022035, "loss": 0.0734, "step": 47800 }, { "epoch": 1.2, "learning_rate": 0.0011982513880863252, "loss": 0.0749, "step": 47810 }, { "epoch": 1.2, "learning_rate": 0.001197874532070447, "loss": 0.0722, "step": 47820 }, { "epoch": 1.2, "learning_rate": 0.0011974976760545687, "loss": 0.0763, "step": 47830 }, { "epoch": 1.2, "learning_rate": 0.0011971208200386905, "loss": 0.0744, "step": 47840 }, { "epoch": 1.2, "learning_rate": 0.0011967439640228124, "loss": 0.0742, "step": 47850 }, { "epoch": 1.2, "learning_rate": 0.0011963671080069342, "loss": 0.0758, "step": 47860 }, { "epoch": 1.2, "learning_rate": 0.001195990251991056, "loss": 0.0728, "step": 47870 }, { "epoch": 1.2, "learning_rate": 0.0011956133959751777, "loss": 0.0753, "step": 47880 }, { "epoch": 1.2, "learning_rate": 0.0011952365399592996, "loss": 0.0746, "step": 47890 }, { "epoch": 1.2, "learning_rate": 0.0011948596839434214, "loss": 0.0771, "step": 47900 }, { "epoch": 1.2, "learning_rate": 0.0011944828279275431, "loss": 0.0751, "step": 47910 }, { "epoch": 1.2, "learning_rate": 0.0011941059719116649, "loss": 0.0762, "step": 47920 }, { "epoch": 1.2, "learning_rate": 0.0011937291158957868, "loss": 0.0777, "step": 47930 }, { "epoch": 1.2, "learning_rate": 0.0011933522598799086, "loss": 0.0739, "step": 47940 }, { "epoch": 1.2, "learning_rate": 0.0011929754038640305, "loss": 0.0722, "step": 47950 }, { "epoch": 1.2, "learning_rate": 0.001192598547848152, "loss": 0.0783, "step": 47960 }, { "epoch": 1.21, "learning_rate": 0.001192221691832274, "loss": 0.0764, "step": 47970 }, { "epoch": 1.21, "learning_rate": 0.0011918448358163958, "loss": 0.0771, "step": 47980 }, { "epoch": 1.21, "learning_rate": 0.0011914679798005177, "loss": 0.0754, "step": 47990 }, { "epoch": 1.21, "learning_rate": 0.0011910911237846392, "loss": 0.0766, "step": 48000 }, { "epoch": 1.21, "eval_cer": 0.6658129640564252, "eval_loss": 0.06356838345527649, "eval_runtime": 90.7662, "eval_samples_per_second": 110.162, "eval_steps_per_second": 6.886, "step": 48000 }, { "epoch": 1.21, "learning_rate": 0.0011907142677687612, "loss": 0.076, "step": 48010 }, { "epoch": 1.21, "learning_rate": 0.001190337411752883, "loss": 0.0752, "step": 48020 }, { "epoch": 1.21, "learning_rate": 0.001189960555737005, "loss": 0.0744, "step": 48030 }, { "epoch": 1.21, "learning_rate": 0.0011895836997211267, "loss": 0.0683, "step": 48040 }, { "epoch": 1.21, "learning_rate": 0.0011892068437052484, "loss": 0.0783, "step": 48050 }, { "epoch": 1.21, "learning_rate": 0.0011888299876893701, "loss": 0.0759, "step": 48060 }, { "epoch": 1.21, "learning_rate": 0.001188453131673492, "loss": 0.0764, "step": 48070 }, { "epoch": 1.21, "learning_rate": 0.0011880762756576139, "loss": 0.073, "step": 48080 }, { "epoch": 1.21, "learning_rate": 0.0011876994196417356, "loss": 0.0721, "step": 48090 }, { "epoch": 1.21, "learning_rate": 0.0011873225636258573, "loss": 0.073, "step": 48100 }, { "epoch": 1.21, "learning_rate": 0.001186945707609979, "loss": 0.0765, "step": 48110 }, { "epoch": 1.21, "learning_rate": 0.001186568851594101, "loss": 0.0761, "step": 48120 }, { "epoch": 1.21, "learning_rate": 0.0011861919955782228, "loss": 0.0743, "step": 48130 }, { "epoch": 1.21, "learning_rate": 0.0011858151395623445, "loss": 0.0775, "step": 48140 }, { "epoch": 1.21, "learning_rate": 0.0011854382835464663, "loss": 0.0735, "step": 48150 }, { "epoch": 1.21, "learning_rate": 0.0011850614275305882, "loss": 0.0763, "step": 48160 }, { "epoch": 1.21, "learning_rate": 0.00118468457151471, "loss": 0.0743, "step": 48170 }, { "epoch": 1.21, "learning_rate": 0.0011843077154988317, "loss": 0.0745, "step": 48180 }, { "epoch": 1.21, "learning_rate": 0.0011839308594829535, "loss": 0.0743, "step": 48190 }, { "epoch": 1.21, "learning_rate": 0.0011835540034670754, "loss": 0.0788, "step": 48200 }, { "epoch": 1.21, "learning_rate": 0.0011831771474511972, "loss": 0.0773, "step": 48210 }, { "epoch": 1.21, "learning_rate": 0.001182800291435319, "loss": 0.075, "step": 48220 }, { "epoch": 1.21, "learning_rate": 0.0011824234354194407, "loss": 0.0726, "step": 48230 }, { "epoch": 1.21, "learning_rate": 0.0011820465794035626, "loss": 0.0738, "step": 48240 }, { "epoch": 1.21, "learning_rate": 0.0011816697233876844, "loss": 0.073, "step": 48250 }, { "epoch": 1.21, "learning_rate": 0.0011812928673718063, "loss": 0.0726, "step": 48260 }, { "epoch": 1.21, "learning_rate": 0.0011809160113559279, "loss": 0.0748, "step": 48270 }, { "epoch": 1.21, "learning_rate": 0.0011805391553400496, "loss": 0.0738, "step": 48280 }, { "epoch": 1.21, "learning_rate": 0.0011801622993241716, "loss": 0.0741, "step": 48290 }, { "epoch": 1.21, "learning_rate": 0.0011797854433082933, "loss": 0.076, "step": 48300 }, { "epoch": 1.21, "learning_rate": 0.0011794085872924153, "loss": 0.0777, "step": 48310 }, { "epoch": 1.21, "learning_rate": 0.0011790317312765368, "loss": 0.0754, "step": 48320 }, { "epoch": 1.21, "learning_rate": 0.0011786548752606588, "loss": 0.0725, "step": 48330 }, { "epoch": 1.21, "learning_rate": 0.0011782780192447805, "loss": 0.0726, "step": 48340 }, { "epoch": 1.21, "learning_rate": 0.0011779011632289025, "loss": 0.0746, "step": 48350 }, { "epoch": 1.21, "learning_rate": 0.0011775243072130242, "loss": 0.0734, "step": 48360 }, { "epoch": 1.22, "learning_rate": 0.001177147451197146, "loss": 0.076, "step": 48370 }, { "epoch": 1.22, "learning_rate": 0.0011767705951812677, "loss": 0.0757, "step": 48380 }, { "epoch": 1.22, "learning_rate": 0.0011763937391653897, "loss": 0.0746, "step": 48390 }, { "epoch": 1.22, "learning_rate": 0.0011760168831495114, "loss": 0.0745, "step": 48400 }, { "epoch": 1.22, "learning_rate": 0.0011756400271336332, "loss": 0.0709, "step": 48410 }, { "epoch": 1.22, "learning_rate": 0.001175263171117755, "loss": 0.0751, "step": 48420 }, { "epoch": 1.22, "learning_rate": 0.0011748863151018769, "loss": 0.0737, "step": 48430 }, { "epoch": 1.22, "learning_rate": 0.0011745094590859986, "loss": 0.0743, "step": 48440 }, { "epoch": 1.22, "learning_rate": 0.0011741326030701204, "loss": 0.074, "step": 48450 }, { "epoch": 1.22, "learning_rate": 0.001173755747054242, "loss": 0.0747, "step": 48460 }, { "epoch": 1.22, "learning_rate": 0.001173378891038364, "loss": 0.0754, "step": 48470 }, { "epoch": 1.22, "learning_rate": 0.0011730020350224858, "loss": 0.0741, "step": 48480 }, { "epoch": 1.22, "learning_rate": 0.0011726251790066076, "loss": 0.0728, "step": 48490 }, { "epoch": 1.22, "learning_rate": 0.0011722483229907293, "loss": 0.0774, "step": 48500 }, { "epoch": 1.22, "eval_cer": 0.6654024745826169, "eval_loss": 0.06362287700176239, "eval_runtime": 90.7928, "eval_samples_per_second": 110.13, "eval_steps_per_second": 6.884, "step": 48500 }, { "epoch": 1.22, "learning_rate": 0.001171871466974851, "loss": 0.0727, "step": 48510 }, { "epoch": 1.22, "learning_rate": 0.001171494610958973, "loss": 0.0757, "step": 48520 }, { "epoch": 1.22, "learning_rate": 0.0011711177549430947, "loss": 0.0747, "step": 48530 }, { "epoch": 1.22, "learning_rate": 0.0011707408989272165, "loss": 0.0717, "step": 48540 }, { "epoch": 1.22, "learning_rate": 0.0011703640429113382, "loss": 0.0726, "step": 48550 }, { "epoch": 1.22, "learning_rate": 0.0011699871868954602, "loss": 0.0759, "step": 48560 }, { "epoch": 1.22, "learning_rate": 0.001169610330879582, "loss": 0.0735, "step": 48570 }, { "epoch": 1.22, "learning_rate": 0.0011692334748637037, "loss": 0.0753, "step": 48580 }, { "epoch": 1.22, "learning_rate": 0.0011688566188478254, "loss": 0.0756, "step": 48590 }, { "epoch": 1.22, "learning_rate": 0.0011684797628319474, "loss": 0.077, "step": 48600 }, { "epoch": 1.22, "learning_rate": 0.0011681029068160691, "loss": 0.0771, "step": 48610 }, { "epoch": 1.22, "learning_rate": 0.001167726050800191, "loss": 0.0744, "step": 48620 }, { "epoch": 1.22, "learning_rate": 0.0011673491947843126, "loss": 0.0755, "step": 48630 }, { "epoch": 1.22, "learning_rate": 0.0011669723387684346, "loss": 0.0741, "step": 48640 }, { "epoch": 1.22, "learning_rate": 0.0011665954827525563, "loss": 0.0739, "step": 48650 }, { "epoch": 1.22, "learning_rate": 0.0011662186267366783, "loss": 0.0797, "step": 48660 }, { "epoch": 1.22, "learning_rate": 0.0011658417707208, "loss": 0.0767, "step": 48670 }, { "epoch": 1.22, "learning_rate": 0.0011654649147049218, "loss": 0.0716, "step": 48680 }, { "epoch": 1.22, "learning_rate": 0.0011650880586890435, "loss": 0.074, "step": 48690 }, { "epoch": 1.22, "learning_rate": 0.0011647112026731655, "loss": 0.0739, "step": 48700 }, { "epoch": 1.22, "learning_rate": 0.0011643343466572872, "loss": 0.0761, "step": 48710 }, { "epoch": 1.22, "learning_rate": 0.001163957490641409, "loss": 0.0747, "step": 48720 }, { "epoch": 1.22, "learning_rate": 0.0011635806346255307, "loss": 0.0743, "step": 48730 }, { "epoch": 1.22, "learning_rate": 0.0011632037786096525, "loss": 0.077, "step": 48740 }, { "epoch": 1.22, "learning_rate": 0.0011628269225937744, "loss": 0.0733, "step": 48750 }, { "epoch": 1.23, "learning_rate": 0.0011624500665778962, "loss": 0.0738, "step": 48760 }, { "epoch": 1.23, "learning_rate": 0.001162073210562018, "loss": 0.0743, "step": 48770 }, { "epoch": 1.23, "learning_rate": 0.0011616963545461397, "loss": 0.0693, "step": 48780 }, { "epoch": 1.23, "learning_rate": 0.0011613194985302616, "loss": 0.0751, "step": 48790 }, { "epoch": 1.23, "learning_rate": 0.0011609426425143834, "loss": 0.0763, "step": 48800 }, { "epoch": 1.23, "learning_rate": 0.0011605657864985051, "loss": 0.0735, "step": 48810 }, { "epoch": 1.23, "learning_rate": 0.0011601889304826269, "loss": 0.072, "step": 48820 }, { "epoch": 1.23, "learning_rate": 0.0011598120744667488, "loss": 0.0746, "step": 48830 }, { "epoch": 1.23, "learning_rate": 0.0011594352184508706, "loss": 0.0719, "step": 48840 }, { "epoch": 1.23, "learning_rate": 0.0011590583624349923, "loss": 0.0727, "step": 48850 }, { "epoch": 1.23, "learning_rate": 0.001158681506419114, "loss": 0.0714, "step": 48860 }, { "epoch": 1.23, "learning_rate": 0.001158304650403236, "loss": 0.0733, "step": 48870 }, { "epoch": 1.23, "learning_rate": 0.0011579277943873578, "loss": 0.0756, "step": 48880 }, { "epoch": 1.23, "learning_rate": 0.0011575509383714797, "loss": 0.0751, "step": 48890 }, { "epoch": 1.23, "learning_rate": 0.0011571740823556013, "loss": 0.0766, "step": 48900 }, { "epoch": 1.23, "learning_rate": 0.0011567972263397232, "loss": 0.0733, "step": 48910 }, { "epoch": 1.23, "learning_rate": 0.001156420370323845, "loss": 0.0753, "step": 48920 }, { "epoch": 1.23, "learning_rate": 0.001156043514307967, "loss": 0.0745, "step": 48930 }, { "epoch": 1.23, "learning_rate": 0.0011556666582920887, "loss": 0.0714, "step": 48940 }, { "epoch": 1.23, "learning_rate": 0.0011552898022762102, "loss": 0.0719, "step": 48950 }, { "epoch": 1.23, "learning_rate": 0.0011549129462603322, "loss": 0.0776, "step": 48960 }, { "epoch": 1.23, "learning_rate": 0.001154536090244454, "loss": 0.0732, "step": 48970 }, { "epoch": 1.23, "learning_rate": 0.0011541592342285759, "loss": 0.073, "step": 48980 }, { "epoch": 1.23, "learning_rate": 0.0011537823782126974, "loss": 0.0719, "step": 48990 }, { "epoch": 1.23, "learning_rate": 0.0011534055221968193, "loss": 0.0759, "step": 49000 }, { "epoch": 1.23, "eval_cer": 0.6653995872006206, "eval_loss": 0.06333644688129425, "eval_runtime": 90.5934, "eval_samples_per_second": 110.372, "eval_steps_per_second": 6.899, "step": 49000 }, { "epoch": 1.23, "learning_rate": 0.001153028666180941, "loss": 0.0753, "step": 49010 }, { "epoch": 1.23, "learning_rate": 0.001152651810165063, "loss": 0.0756, "step": 49020 }, { "epoch": 1.23, "learning_rate": 0.0011522749541491848, "loss": 0.075, "step": 49030 }, { "epoch": 1.23, "learning_rate": 0.0011518980981333065, "loss": 0.0776, "step": 49040 }, { "epoch": 1.23, "learning_rate": 0.0011515212421174283, "loss": 0.0742, "step": 49050 }, { "epoch": 1.23, "learning_rate": 0.0011511443861015502, "loss": 0.0702, "step": 49060 }, { "epoch": 1.23, "learning_rate": 0.001150767530085672, "loss": 0.0716, "step": 49070 }, { "epoch": 1.23, "learning_rate": 0.0011503906740697937, "loss": 0.0765, "step": 49080 }, { "epoch": 1.23, "learning_rate": 0.0011500138180539155, "loss": 0.0757, "step": 49090 }, { "epoch": 1.23, "learning_rate": 0.0011496369620380374, "loss": 0.0748, "step": 49100 }, { "epoch": 1.23, "learning_rate": 0.0011492601060221592, "loss": 0.0748, "step": 49110 }, { "epoch": 1.23, "learning_rate": 0.001148883250006281, "loss": 0.074, "step": 49120 }, { "epoch": 1.23, "learning_rate": 0.0011485063939904027, "loss": 0.0707, "step": 49130 }, { "epoch": 1.23, "learning_rate": 0.0011481295379745246, "loss": 0.0753, "step": 49140 }, { "epoch": 1.23, "learning_rate": 0.0011477526819586464, "loss": 0.0722, "step": 49150 }, { "epoch": 1.24, "learning_rate": 0.0011473758259427681, "loss": 0.0706, "step": 49160 }, { "epoch": 1.24, "learning_rate": 0.0011469989699268899, "loss": 0.0758, "step": 49170 }, { "epoch": 1.24, "learning_rate": 0.0011466221139110116, "loss": 0.0752, "step": 49180 }, { "epoch": 1.24, "learning_rate": 0.0011462452578951336, "loss": 0.0752, "step": 49190 }, { "epoch": 1.24, "learning_rate": 0.0011458684018792553, "loss": 0.0733, "step": 49200 }, { "epoch": 1.24, "learning_rate": 0.001145491545863377, "loss": 0.0745, "step": 49210 }, { "epoch": 1.24, "learning_rate": 0.0011451146898474988, "loss": 0.0728, "step": 49220 }, { "epoch": 1.24, "learning_rate": 0.0011447378338316208, "loss": 0.0768, "step": 49230 }, { "epoch": 1.24, "learning_rate": 0.0011443609778157425, "loss": 0.0731, "step": 49240 }, { "epoch": 1.24, "learning_rate": 0.0011439841217998645, "loss": 0.0727, "step": 49250 }, { "epoch": 1.24, "learning_rate": 0.001143607265783986, "loss": 0.0718, "step": 49260 }, { "epoch": 1.24, "learning_rate": 0.001143230409768108, "loss": 0.076, "step": 49270 }, { "epoch": 1.24, "learning_rate": 0.0011428535537522297, "loss": 0.0717, "step": 49280 }, { "epoch": 1.24, "learning_rate": 0.0011424766977363517, "loss": 0.0729, "step": 49290 }, { "epoch": 1.24, "learning_rate": 0.0011420998417204734, "loss": 0.0742, "step": 49300 }, { "epoch": 1.24, "learning_rate": 0.0011417229857045952, "loss": 0.0748, "step": 49310 }, { "epoch": 1.24, "learning_rate": 0.001141346129688717, "loss": 0.0772, "step": 49320 }, { "epoch": 1.24, "learning_rate": 0.0011409692736728389, "loss": 0.075, "step": 49330 }, { "epoch": 1.24, "learning_rate": 0.0011405924176569606, "loss": 0.074, "step": 49340 }, { "epoch": 1.24, "learning_rate": 0.0011402155616410824, "loss": 0.0742, "step": 49350 }, { "epoch": 1.24, "learning_rate": 0.001139838705625204, "loss": 0.0732, "step": 49360 }, { "epoch": 1.24, "learning_rate": 0.001139461849609326, "loss": 0.0739, "step": 49370 }, { "epoch": 1.24, "learning_rate": 0.0011390849935934478, "loss": 0.0716, "step": 49380 }, { "epoch": 1.24, "learning_rate": 0.0011387081375775696, "loss": 0.0743, "step": 49390 }, { "epoch": 1.24, "learning_rate": 0.0011383312815616913, "loss": 0.0735, "step": 49400 }, { "epoch": 1.24, "learning_rate": 0.001137954425545813, "loss": 0.074, "step": 49410 }, { "epoch": 1.24, "learning_rate": 0.001137577569529935, "loss": 0.0767, "step": 49420 }, { "epoch": 1.24, "learning_rate": 0.0011372007135140568, "loss": 0.0734, "step": 49430 }, { "epoch": 1.24, "learning_rate": 0.0011368238574981785, "loss": 0.0748, "step": 49440 }, { "epoch": 1.24, "learning_rate": 0.0011364470014823002, "loss": 0.0728, "step": 49450 }, { "epoch": 1.24, "learning_rate": 0.0011360701454664222, "loss": 0.0757, "step": 49460 }, { "epoch": 1.24, "learning_rate": 0.001135693289450544, "loss": 0.0732, "step": 49470 }, { "epoch": 1.24, "learning_rate": 0.0011353164334346657, "loss": 0.0748, "step": 49480 }, { "epoch": 1.24, "learning_rate": 0.0011349395774187874, "loss": 0.0749, "step": 49490 }, { "epoch": 1.24, "learning_rate": 0.0011345627214029094, "loss": 0.0779, "step": 49500 }, { "epoch": 1.24, "eval_cer": 0.6658298071180704, "eval_loss": 0.06252450495958328, "eval_runtime": 90.8892, "eval_samples_per_second": 110.013, "eval_steps_per_second": 6.877, "step": 49500 }, { "epoch": 1.24, "learning_rate": 0.0011341858653870311, "loss": 0.0753, "step": 49510 }, { "epoch": 1.24, "learning_rate": 0.001133809009371153, "loss": 0.0728, "step": 49520 }, { "epoch": 1.24, "learning_rate": 0.0011334321533552746, "loss": 0.0729, "step": 49530 }, { "epoch": 1.24, "learning_rate": 0.0011330552973393966, "loss": 0.0739, "step": 49540 }, { "epoch": 1.24, "learning_rate": 0.0011326784413235183, "loss": 0.0728, "step": 49550 }, { "epoch": 1.25, "learning_rate": 0.0011323015853076403, "loss": 0.0718, "step": 49560 }, { "epoch": 1.25, "learning_rate": 0.0011319247292917618, "loss": 0.0732, "step": 49570 }, { "epoch": 1.25, "learning_rate": 0.0011315478732758838, "loss": 0.07, "step": 49580 }, { "epoch": 1.25, "learning_rate": 0.0011311710172600055, "loss": 0.0729, "step": 49590 }, { "epoch": 1.25, "learning_rate": 0.0011307941612441275, "loss": 0.0758, "step": 49600 }, { "epoch": 1.25, "learning_rate": 0.0011304173052282492, "loss": 0.0699, "step": 49610 }, { "epoch": 1.25, "learning_rate": 0.0011300404492123708, "loss": 0.0747, "step": 49620 }, { "epoch": 1.25, "learning_rate": 0.0011296635931964927, "loss": 0.0734, "step": 49630 }, { "epoch": 1.25, "learning_rate": 0.0011292867371806145, "loss": 0.0766, "step": 49640 }, { "epoch": 1.25, "learning_rate": 0.0011289098811647364, "loss": 0.07, "step": 49650 }, { "epoch": 1.25, "learning_rate": 0.0011285330251488582, "loss": 0.0743, "step": 49660 }, { "epoch": 1.25, "learning_rate": 0.00112815616913298, "loss": 0.0731, "step": 49670 }, { "epoch": 1.25, "learning_rate": 0.0011277793131171017, "loss": 0.0761, "step": 49680 }, { "epoch": 1.25, "learning_rate": 0.0011274024571012236, "loss": 0.0764, "step": 49690 }, { "epoch": 1.25, "learning_rate": 0.0011270256010853454, "loss": 0.0761, "step": 49700 }, { "epoch": 1.25, "learning_rate": 0.0011266487450694671, "loss": 0.0736, "step": 49710 }, { "epoch": 1.25, "learning_rate": 0.0011262718890535889, "loss": 0.0747, "step": 49720 }, { "epoch": 1.25, "learning_rate": 0.0011258950330377108, "loss": 0.075, "step": 49730 }, { "epoch": 1.25, "learning_rate": 0.0011255181770218326, "loss": 0.0718, "step": 49740 }, { "epoch": 1.25, "learning_rate": 0.0011251413210059543, "loss": 0.0731, "step": 49750 }, { "epoch": 1.25, "learning_rate": 0.001124764464990076, "loss": 0.0732, "step": 49760 }, { "epoch": 1.25, "learning_rate": 0.001124387608974198, "loss": 0.0723, "step": 49770 }, { "epoch": 1.25, "learning_rate": 0.0011240107529583198, "loss": 0.0742, "step": 49780 }, { "epoch": 1.25, "learning_rate": 0.0011236338969424415, "loss": 0.0738, "step": 49790 }, { "epoch": 1.25, "learning_rate": 0.0011232570409265633, "loss": 0.0736, "step": 49800 }, { "epoch": 1.25, "learning_rate": 0.0011228801849106852, "loss": 0.0723, "step": 49810 }, { "epoch": 1.25, "learning_rate": 0.001122503328894807, "loss": 0.0717, "step": 49820 }, { "epoch": 1.25, "learning_rate": 0.001122126472878929, "loss": 0.0742, "step": 49830 }, { "epoch": 1.25, "learning_rate": 0.0011217496168630505, "loss": 0.0732, "step": 49840 }, { "epoch": 1.25, "learning_rate": 0.0011213727608471722, "loss": 0.0749, "step": 49850 }, { "epoch": 1.25, "learning_rate": 0.0011209959048312942, "loss": 0.0745, "step": 49860 }, { "epoch": 1.25, "learning_rate": 0.001120619048815416, "loss": 0.0701, "step": 49870 }, { "epoch": 1.25, "learning_rate": 0.0011202421927995379, "loss": 0.0746, "step": 49880 }, { "epoch": 1.25, "learning_rate": 0.0011198653367836594, "loss": 0.0732, "step": 49890 }, { "epoch": 1.25, "learning_rate": 0.0011194884807677814, "loss": 0.0706, "step": 49900 }, { "epoch": 1.25, "learning_rate": 0.001119111624751903, "loss": 0.0709, "step": 49910 }, { "epoch": 1.25, "learning_rate": 0.001118734768736025, "loss": 0.0755, "step": 49920 }, { "epoch": 1.25, "learning_rate": 0.0011183579127201468, "loss": 0.0707, "step": 49930 }, { "epoch": 1.25, "learning_rate": 0.0011179810567042685, "loss": 0.0744, "step": 49940 }, { "epoch": 1.25, "learning_rate": 0.0011176042006883903, "loss": 0.0713, "step": 49950 }, { "epoch": 1.26, "learning_rate": 0.0011172273446725123, "loss": 0.0766, "step": 49960 }, { "epoch": 1.26, "learning_rate": 0.001116850488656634, "loss": 0.0723, "step": 49970 }, { "epoch": 1.26, "learning_rate": 0.0011164736326407557, "loss": 0.0761, "step": 49980 }, { "epoch": 1.26, "learning_rate": 0.0011160967766248775, "loss": 0.0763, "step": 49990 }, { "epoch": 1.26, "learning_rate": 0.0011157199206089994, "loss": 0.074, "step": 50000 }, { "epoch": 1.26, "eval_cer": 0.6653543515493451, "eval_loss": 0.06283344328403473, "eval_runtime": 90.7413, "eval_samples_per_second": 110.192, "eval_steps_per_second": 6.888, "step": 50000 }, { "epoch": 1.26, "learning_rate": 0.0011153430645931212, "loss": 0.0736, "step": 50010 }, { "epoch": 1.26, "learning_rate": 0.001114966208577243, "loss": 0.0729, "step": 50020 }, { "epoch": 1.26, "learning_rate": 0.0011145893525613647, "loss": 0.0761, "step": 50030 }, { "epoch": 1.26, "learning_rate": 0.0011142124965454866, "loss": 0.0715, "step": 50040 }, { "epoch": 1.26, "learning_rate": 0.0011138356405296084, "loss": 0.07, "step": 50050 }, { "epoch": 1.26, "learning_rate": 0.0011134587845137301, "loss": 0.076, "step": 50060 }, { "epoch": 1.26, "learning_rate": 0.0011130819284978519, "loss": 0.0735, "step": 50070 }, { "epoch": 1.26, "learning_rate": 0.0011127050724819736, "loss": 0.0744, "step": 50080 }, { "epoch": 1.26, "learning_rate": 0.0011123282164660956, "loss": 0.0741, "step": 50090 }, { "epoch": 1.26, "learning_rate": 0.0011119513604502173, "loss": 0.0733, "step": 50100 }, { "epoch": 1.26, "learning_rate": 0.001111574504434339, "loss": 0.0721, "step": 50110 }, { "epoch": 1.26, "learning_rate": 0.0011111976484184608, "loss": 0.0716, "step": 50120 }, { "epoch": 1.26, "learning_rate": 0.0011108207924025828, "loss": 0.0744, "step": 50130 }, { "epoch": 1.26, "learning_rate": 0.0011104439363867045, "loss": 0.0752, "step": 50140 }, { "epoch": 1.26, "learning_rate": 0.0011100670803708263, "loss": 0.0764, "step": 50150 }, { "epoch": 1.26, "learning_rate": 0.001109690224354948, "loss": 0.0725, "step": 50160 }, { "epoch": 1.26, "learning_rate": 0.00110931336833907, "loss": 0.0721, "step": 50170 }, { "epoch": 1.26, "learning_rate": 0.0011089365123231917, "loss": 0.0712, "step": 50180 }, { "epoch": 1.26, "learning_rate": 0.0011085596563073137, "loss": 0.0699, "step": 50190 }, { "epoch": 1.26, "learning_rate": 0.0011081828002914352, "loss": 0.0734, "step": 50200 }, { "epoch": 1.26, "learning_rate": 0.0011078059442755572, "loss": 0.0749, "step": 50210 }, { "epoch": 1.26, "learning_rate": 0.001107429088259679, "loss": 0.0726, "step": 50220 }, { "epoch": 1.26, "learning_rate": 0.0011070522322438009, "loss": 0.0707, "step": 50230 }, { "epoch": 1.26, "learning_rate": 0.0011066753762279226, "loss": 0.076, "step": 50240 }, { "epoch": 1.26, "learning_rate": 0.0011062985202120444, "loss": 0.0771, "step": 50250 }, { "epoch": 1.26, "learning_rate": 0.0011059216641961661, "loss": 0.0719, "step": 50260 }, { "epoch": 1.26, "learning_rate": 0.001105544808180288, "loss": 0.0722, "step": 50270 }, { "epoch": 1.26, "learning_rate": 0.0011051679521644098, "loss": 0.0743, "step": 50280 }, { "epoch": 1.26, "learning_rate": 0.0011047910961485316, "loss": 0.0727, "step": 50290 }, { "epoch": 1.26, "learning_rate": 0.0011044142401326533, "loss": 0.0727, "step": 50300 }, { "epoch": 1.26, "learning_rate": 0.001104037384116775, "loss": 0.0709, "step": 50310 }, { "epoch": 1.26, "learning_rate": 0.001103660528100897, "loss": 0.076, "step": 50320 }, { "epoch": 1.26, "learning_rate": 0.0011032836720850188, "loss": 0.0754, "step": 50330 }, { "epoch": 1.26, "learning_rate": 0.0011029068160691405, "loss": 0.0709, "step": 50340 }, { "epoch": 1.26, "learning_rate": 0.0011025299600532622, "loss": 0.0722, "step": 50350 }, { "epoch": 1.27, "learning_rate": 0.0011021531040373842, "loss": 0.072, "step": 50360 }, { "epoch": 1.27, "learning_rate": 0.001101776248021506, "loss": 0.0725, "step": 50370 }, { "epoch": 1.27, "learning_rate": 0.0011013993920056277, "loss": 0.0738, "step": 50380 }, { "epoch": 1.27, "learning_rate": 0.0011010225359897494, "loss": 0.0783, "step": 50390 }, { "epoch": 1.27, "learning_rate": 0.0011006456799738714, "loss": 0.0732, "step": 50400 }, { "epoch": 1.27, "learning_rate": 0.0011002688239579931, "loss": 0.0703, "step": 50410 }, { "epoch": 1.27, "learning_rate": 0.0010998919679421149, "loss": 0.0755, "step": 50420 }, { "epoch": 1.27, "learning_rate": 0.0010995151119262366, "loss": 0.0727, "step": 50430 }, { "epoch": 1.27, "learning_rate": 0.0010991382559103586, "loss": 0.0755, "step": 50440 }, { "epoch": 1.27, "learning_rate": 0.0010987613998944803, "loss": 0.0723, "step": 50450 }, { "epoch": 1.27, "learning_rate": 0.0010983845438786023, "loss": 0.0739, "step": 50460 }, { "epoch": 1.27, "learning_rate": 0.0010980076878627238, "loss": 0.0737, "step": 50470 }, { "epoch": 1.27, "learning_rate": 0.0010976308318468458, "loss": 0.0738, "step": 50480 }, { "epoch": 1.27, "learning_rate": 0.0010972539758309675, "loss": 0.0722, "step": 50490 }, { "epoch": 1.27, "learning_rate": 0.0010968771198150895, "loss": 0.0761, "step": 50500 }, { "epoch": 1.27, "eval_cer": 0.665603628861693, "eval_loss": 0.062332626432180405, "eval_runtime": 90.8939, "eval_samples_per_second": 110.007, "eval_steps_per_second": 6.876, "step": 50500 }, { "epoch": 1.27, "learning_rate": 0.0010965002637992112, "loss": 0.0728, "step": 50510 }, { "epoch": 1.27, "learning_rate": 0.0010961234077833328, "loss": 0.0722, "step": 50520 }, { "epoch": 1.27, "learning_rate": 0.0010957465517674547, "loss": 0.075, "step": 50530 }, { "epoch": 1.27, "learning_rate": 0.0010953696957515765, "loss": 0.0712, "step": 50540 }, { "epoch": 1.27, "learning_rate": 0.0010949928397356984, "loss": 0.0712, "step": 50550 }, { "epoch": 1.27, "learning_rate": 0.00109461598371982, "loss": 0.0739, "step": 50560 }, { "epoch": 1.27, "learning_rate": 0.001094239127703942, "loss": 0.0758, "step": 50570 }, { "epoch": 1.27, "learning_rate": 0.0010938622716880637, "loss": 0.0721, "step": 50580 }, { "epoch": 1.27, "learning_rate": 0.0010934854156721856, "loss": 0.0738, "step": 50590 }, { "epoch": 1.27, "learning_rate": 0.0010931085596563074, "loss": 0.0707, "step": 50600 }, { "epoch": 1.27, "learning_rate": 0.0010927317036404291, "loss": 0.0731, "step": 50610 }, { "epoch": 1.27, "learning_rate": 0.0010923548476245509, "loss": 0.073, "step": 50620 }, { "epoch": 1.27, "learning_rate": 0.0010919779916086728, "loss": 0.0762, "step": 50630 }, { "epoch": 1.27, "learning_rate": 0.0010916011355927946, "loss": 0.0744, "step": 50640 }, { "epoch": 1.27, "learning_rate": 0.0010912242795769163, "loss": 0.0736, "step": 50650 }, { "epoch": 1.27, "learning_rate": 0.001090847423561038, "loss": 0.0742, "step": 50660 }, { "epoch": 1.27, "learning_rate": 0.00109047056754516, "loss": 0.0778, "step": 50670 }, { "epoch": 1.27, "learning_rate": 0.0010900937115292818, "loss": 0.0742, "step": 50680 }, { "epoch": 1.27, "learning_rate": 0.0010897168555134035, "loss": 0.0732, "step": 50690 }, { "epoch": 1.27, "learning_rate": 0.0010893399994975253, "loss": 0.0738, "step": 50700 }, { "epoch": 1.27, "learning_rate": 0.0010889631434816472, "loss": 0.0721, "step": 50710 }, { "epoch": 1.27, "learning_rate": 0.001088586287465769, "loss": 0.0775, "step": 50720 }, { "epoch": 1.27, "learning_rate": 0.0010882094314498907, "loss": 0.0732, "step": 50730 }, { "epoch": 1.27, "learning_rate": 0.0010878325754340125, "loss": 0.0718, "step": 50740 }, { "epoch": 1.28, "learning_rate": 0.0010874557194181342, "loss": 0.0709, "step": 50750 }, { "epoch": 1.28, "learning_rate": 0.0010870788634022562, "loss": 0.0746, "step": 50760 }, { "epoch": 1.28, "learning_rate": 0.001086702007386378, "loss": 0.0775, "step": 50770 }, { "epoch": 1.28, "learning_rate": 0.0010863251513704996, "loss": 0.0724, "step": 50780 }, { "epoch": 1.28, "learning_rate": 0.0010859482953546214, "loss": 0.0755, "step": 50790 }, { "epoch": 1.28, "learning_rate": 0.0010855714393387434, "loss": 0.0748, "step": 50800 }, { "epoch": 1.28, "learning_rate": 0.001085194583322865, "loss": 0.0774, "step": 50810 }, { "epoch": 1.28, "learning_rate": 0.001084817727306987, "loss": 0.0721, "step": 50820 }, { "epoch": 1.28, "learning_rate": 0.0010844408712911086, "loss": 0.075, "step": 50830 }, { "epoch": 1.28, "learning_rate": 0.0010840640152752306, "loss": 0.0717, "step": 50840 }, { "epoch": 1.28, "learning_rate": 0.0010836871592593523, "loss": 0.072, "step": 50850 }, { "epoch": 1.28, "learning_rate": 0.0010833103032434743, "loss": 0.072, "step": 50860 }, { "epoch": 1.28, "learning_rate": 0.001082933447227596, "loss": 0.0769, "step": 50870 }, { "epoch": 1.28, "learning_rate": 0.0010825565912117177, "loss": 0.0747, "step": 50880 }, { "epoch": 1.28, "learning_rate": 0.0010821797351958395, "loss": 0.0706, "step": 50890 }, { "epoch": 1.28, "learning_rate": 0.0010818028791799615, "loss": 0.0691, "step": 50900 }, { "epoch": 1.28, "learning_rate": 0.0010814260231640832, "loss": 0.0739, "step": 50910 }, { "epoch": 1.28, "learning_rate": 0.001081049167148205, "loss": 0.0745, "step": 50920 }, { "epoch": 1.28, "learning_rate": 0.0010806723111323267, "loss": 0.0725, "step": 50930 }, { "epoch": 1.28, "learning_rate": 0.0010802954551164486, "loss": 0.0748, "step": 50940 }, { "epoch": 1.28, "learning_rate": 0.0010799185991005704, "loss": 0.0718, "step": 50950 }, { "epoch": 1.28, "learning_rate": 0.0010795417430846921, "loss": 0.0747, "step": 50960 }, { "epoch": 1.28, "learning_rate": 0.0010791648870688139, "loss": 0.0689, "step": 50970 }, { "epoch": 1.28, "learning_rate": 0.0010787880310529356, "loss": 0.0724, "step": 50980 }, { "epoch": 1.28, "learning_rate": 0.0010784111750370576, "loss": 0.0725, "step": 50990 }, { "epoch": 1.28, "learning_rate": 0.0010780343190211793, "loss": 0.0763, "step": 51000 }, { "epoch": 1.28, "eval_cer": 0.6655237446264618, "eval_loss": 0.06174508482217789, "eval_runtime": 90.7553, "eval_samples_per_second": 110.175, "eval_steps_per_second": 6.887, "step": 51000 }, { "epoch": 1.28, "learning_rate": 0.001077657463005301, "loss": 0.0719, "step": 51010 }, { "epoch": 1.28, "learning_rate": 0.0010772806069894228, "loss": 0.0751, "step": 51020 }, { "epoch": 1.28, "learning_rate": 0.0010769037509735448, "loss": 0.0737, "step": 51030 }, { "epoch": 1.28, "learning_rate": 0.0010765268949576665, "loss": 0.0771, "step": 51040 }, { "epoch": 1.28, "learning_rate": 0.0010761500389417883, "loss": 0.0735, "step": 51050 }, { "epoch": 1.28, "learning_rate": 0.00107577318292591, "loss": 0.0738, "step": 51060 }, { "epoch": 1.28, "learning_rate": 0.001075396326910032, "loss": 0.0769, "step": 51070 }, { "epoch": 1.28, "learning_rate": 0.0010750194708941537, "loss": 0.0739, "step": 51080 }, { "epoch": 1.28, "learning_rate": 0.0010746426148782757, "loss": 0.073, "step": 51090 }, { "epoch": 1.28, "learning_rate": 0.0010742657588623972, "loss": 0.0721, "step": 51100 }, { "epoch": 1.28, "learning_rate": 0.0010738889028465192, "loss": 0.0745, "step": 51110 }, { "epoch": 1.28, "learning_rate": 0.001073512046830641, "loss": 0.0729, "step": 51120 }, { "epoch": 1.28, "learning_rate": 0.0010731351908147629, "loss": 0.0725, "step": 51130 }, { "epoch": 1.28, "learning_rate": 0.0010727583347988846, "loss": 0.0733, "step": 51140 }, { "epoch": 1.29, "learning_rate": 0.0010723814787830064, "loss": 0.0735, "step": 51150 }, { "epoch": 1.29, "learning_rate": 0.0010720046227671281, "loss": 0.074, "step": 51160 }, { "epoch": 1.29, "learning_rate": 0.00107162776675125, "loss": 0.0746, "step": 51170 }, { "epoch": 1.29, "learning_rate": 0.0010712509107353718, "loss": 0.0718, "step": 51180 }, { "epoch": 1.29, "learning_rate": 0.0010708740547194933, "loss": 0.0727, "step": 51190 }, { "epoch": 1.29, "learning_rate": 0.0010704971987036153, "loss": 0.0713, "step": 51200 }, { "epoch": 1.29, "learning_rate": 0.001070120342687737, "loss": 0.0702, "step": 51210 }, { "epoch": 1.29, "learning_rate": 0.001069743486671859, "loss": 0.0692, "step": 51220 }, { "epoch": 1.29, "learning_rate": 0.0010693666306559808, "loss": 0.074, "step": 51230 }, { "epoch": 1.29, "learning_rate": 0.0010689897746401025, "loss": 0.0725, "step": 51240 }, { "epoch": 1.29, "learning_rate": 0.0010686129186242242, "loss": 0.076, "step": 51250 }, { "epoch": 1.29, "learning_rate": 0.0010682360626083462, "loss": 0.072, "step": 51260 }, { "epoch": 1.29, "learning_rate": 0.001067859206592468, "loss": 0.0713, "step": 51270 }, { "epoch": 1.29, "learning_rate": 0.0010674823505765897, "loss": 0.0726, "step": 51280 }, { "epoch": 1.29, "learning_rate": 0.0010671054945607114, "loss": 0.0728, "step": 51290 }, { "epoch": 1.29, "learning_rate": 0.0010667286385448334, "loss": 0.0729, "step": 51300 }, { "epoch": 1.29, "learning_rate": 0.0010663517825289552, "loss": 0.0732, "step": 51310 }, { "epoch": 1.29, "learning_rate": 0.001065974926513077, "loss": 0.0726, "step": 51320 }, { "epoch": 1.29, "learning_rate": 0.0010655980704971986, "loss": 0.0739, "step": 51330 }, { "epoch": 1.29, "learning_rate": 0.0010652212144813206, "loss": 0.0724, "step": 51340 }, { "epoch": 1.29, "learning_rate": 0.0010648443584654423, "loss": 0.075, "step": 51350 }, { "epoch": 1.29, "learning_rate": 0.001064467502449564, "loss": 0.0707, "step": 51360 }, { "epoch": 1.29, "learning_rate": 0.0010640906464336858, "loss": 0.0743, "step": 51370 }, { "epoch": 1.29, "learning_rate": 0.0010637137904178078, "loss": 0.0726, "step": 51380 }, { "epoch": 1.29, "learning_rate": 0.0010633369344019295, "loss": 0.0736, "step": 51390 }, { "epoch": 1.29, "learning_rate": 0.0010629600783860513, "loss": 0.0706, "step": 51400 }, { "epoch": 1.29, "learning_rate": 0.001062583222370173, "loss": 0.0744, "step": 51410 }, { "epoch": 1.29, "learning_rate": 0.0010622063663542948, "loss": 0.0723, "step": 51420 }, { "epoch": 1.29, "learning_rate": 0.0010618295103384167, "loss": 0.075, "step": 51430 }, { "epoch": 1.29, "learning_rate": 0.0010614526543225385, "loss": 0.0715, "step": 51440 }, { "epoch": 1.29, "learning_rate": 0.0010610757983066604, "loss": 0.0701, "step": 51450 }, { "epoch": 1.29, "learning_rate": 0.001060698942290782, "loss": 0.0711, "step": 51460 }, { "epoch": 1.29, "learning_rate": 0.001060322086274904, "loss": 0.0731, "step": 51470 }, { "epoch": 1.29, "learning_rate": 0.0010599452302590257, "loss": 0.0721, "step": 51480 }, { "epoch": 1.29, "learning_rate": 0.0010595683742431476, "loss": 0.0705, "step": 51490 }, { "epoch": 1.29, "learning_rate": 0.0010591915182272694, "loss": 0.072, "step": 51500 }, { "epoch": 1.29, "eval_cer": 0.6655559870587539, "eval_loss": 0.0616888590157032, "eval_runtime": 91.034, "eval_samples_per_second": 109.838, "eval_steps_per_second": 6.866, "step": 51500 }, { "epoch": 1.29, "learning_rate": 0.0010588146622113911, "loss": 0.0705, "step": 51510 }, { "epoch": 1.29, "learning_rate": 0.0010584378061955129, "loss": 0.0754, "step": 51520 }, { "epoch": 1.29, "learning_rate": 0.0010580609501796348, "loss": 0.0735, "step": 51530 }, { "epoch": 1.29, "learning_rate": 0.0010576840941637566, "loss": 0.0748, "step": 51540 }, { "epoch": 1.3, "learning_rate": 0.0010573072381478783, "loss": 0.0736, "step": 51550 }, { "epoch": 1.3, "learning_rate": 0.001056930382132, "loss": 0.0704, "step": 51560 }, { "epoch": 1.3, "learning_rate": 0.001056553526116122, "loss": 0.0718, "step": 51570 }, { "epoch": 1.3, "learning_rate": 0.0010561766701002438, "loss": 0.0751, "step": 51580 }, { "epoch": 1.3, "learning_rate": 0.0010557998140843655, "loss": 0.069, "step": 51590 }, { "epoch": 1.3, "learning_rate": 0.0010554229580684873, "loss": 0.0723, "step": 51600 }, { "epoch": 1.3, "learning_rate": 0.0010550461020526092, "loss": 0.0691, "step": 51610 }, { "epoch": 1.3, "learning_rate": 0.001054669246036731, "loss": 0.0721, "step": 51620 }, { "epoch": 1.3, "learning_rate": 0.0010542923900208527, "loss": 0.0717, "step": 51630 }, { "epoch": 1.3, "learning_rate": 0.0010539155340049745, "loss": 0.0694, "step": 51640 }, { "epoch": 1.3, "learning_rate": 0.0010535386779890962, "loss": 0.0756, "step": 51650 }, { "epoch": 1.3, "learning_rate": 0.0010531618219732182, "loss": 0.0726, "step": 51660 }, { "epoch": 1.3, "learning_rate": 0.00105278496595734, "loss": 0.0762, "step": 51670 }, { "epoch": 1.3, "learning_rate": 0.0010524081099414617, "loss": 0.0737, "step": 51680 }, { "epoch": 1.3, "learning_rate": 0.0010520312539255834, "loss": 0.0721, "step": 51690 }, { "epoch": 1.3, "learning_rate": 0.0010516543979097054, "loss": 0.0731, "step": 51700 }, { "epoch": 1.3, "learning_rate": 0.001051277541893827, "loss": 0.0707, "step": 51710 }, { "epoch": 1.3, "learning_rate": 0.001050900685877949, "loss": 0.0745, "step": 51720 }, { "epoch": 1.3, "learning_rate": 0.0010505238298620706, "loss": 0.07, "step": 51730 }, { "epoch": 1.3, "learning_rate": 0.0010501469738461926, "loss": 0.0709, "step": 51740 }, { "epoch": 1.3, "learning_rate": 0.0010497701178303143, "loss": 0.0716, "step": 51750 }, { "epoch": 1.3, "learning_rate": 0.0010493932618144363, "loss": 0.0748, "step": 51760 }, { "epoch": 1.3, "learning_rate": 0.0010490164057985578, "loss": 0.0731, "step": 51770 }, { "epoch": 1.3, "learning_rate": 0.0010486395497826797, "loss": 0.0765, "step": 51780 }, { "epoch": 1.3, "learning_rate": 0.0010482626937668015, "loss": 0.0749, "step": 51790 }, { "epoch": 1.3, "learning_rate": 0.0010478858377509235, "loss": 0.0731, "step": 51800 }, { "epoch": 1.3, "learning_rate": 0.0010475089817350452, "loss": 0.0739, "step": 51810 }, { "epoch": 1.3, "learning_rate": 0.001047132125719167, "loss": 0.0741, "step": 51820 }, { "epoch": 1.3, "learning_rate": 0.0010467552697032887, "loss": 0.0737, "step": 51830 }, { "epoch": 1.3, "learning_rate": 0.0010463784136874104, "loss": 0.0737, "step": 51840 }, { "epoch": 1.3, "learning_rate": 0.0010460015576715324, "loss": 0.0729, "step": 51850 }, { "epoch": 1.3, "learning_rate": 0.0010456247016556541, "loss": 0.071, "step": 51860 }, { "epoch": 1.3, "learning_rate": 0.0010452478456397759, "loss": 0.072, "step": 51870 }, { "epoch": 1.3, "learning_rate": 0.0010448709896238976, "loss": 0.0693, "step": 51880 }, { "epoch": 1.3, "learning_rate": 0.0010444941336080196, "loss": 0.0739, "step": 51890 }, { "epoch": 1.3, "learning_rate": 0.0010441172775921413, "loss": 0.0753, "step": 51900 }, { "epoch": 1.3, "learning_rate": 0.001043740421576263, "loss": 0.0736, "step": 51910 }, { "epoch": 1.3, "learning_rate": 0.0010433635655603848, "loss": 0.0729, "step": 51920 }, { "epoch": 1.3, "learning_rate": 0.0010429867095445068, "loss": 0.0731, "step": 51930 }, { "epoch": 1.3, "learning_rate": 0.0010426098535286285, "loss": 0.0704, "step": 51940 }, { "epoch": 1.31, "learning_rate": 0.0010422329975127503, "loss": 0.0721, "step": 51950 }, { "epoch": 1.31, "learning_rate": 0.001041856141496872, "loss": 0.0716, "step": 51960 }, { "epoch": 1.31, "learning_rate": 0.001041479285480994, "loss": 0.0714, "step": 51970 }, { "epoch": 1.31, "learning_rate": 0.0010411024294651157, "loss": 0.0706, "step": 51980 }, { "epoch": 1.31, "learning_rate": 0.0010407255734492375, "loss": 0.0709, "step": 51990 }, { "epoch": 1.31, "learning_rate": 0.0010403487174333592, "loss": 0.0718, "step": 52000 }, { "epoch": 1.31, "eval_cer": 0.6653235528080512, "eval_loss": 0.06183711811900139, "eval_runtime": 91.0284, "eval_samples_per_second": 109.845, "eval_steps_per_second": 6.866, "step": 52000 }, { "epoch": 1.31, "learning_rate": 0.0010399718614174812, "loss": 0.0703, "step": 52010 }, { "epoch": 1.31, "learning_rate": 0.001039595005401603, "loss": 0.0703, "step": 52020 }, { "epoch": 1.31, "learning_rate": 0.0010392181493857249, "loss": 0.0732, "step": 52030 }, { "epoch": 1.31, "learning_rate": 0.0010388412933698464, "loss": 0.0729, "step": 52040 }, { "epoch": 1.31, "learning_rate": 0.0010384644373539684, "loss": 0.0738, "step": 52050 }, { "epoch": 1.31, "learning_rate": 0.0010380875813380901, "loss": 0.0747, "step": 52060 }, { "epoch": 1.31, "learning_rate": 0.0010377107253222119, "loss": 0.0749, "step": 52070 }, { "epoch": 1.31, "learning_rate": 0.0010373338693063338, "loss": 0.0732, "step": 52080 }, { "epoch": 1.31, "learning_rate": 0.0010369570132904554, "loss": 0.075, "step": 52090 }, { "epoch": 1.31, "learning_rate": 0.0010365801572745773, "loss": 0.0721, "step": 52100 }, { "epoch": 1.31, "learning_rate": 0.001036203301258699, "loss": 0.0716, "step": 52110 }, { "epoch": 1.31, "learning_rate": 0.001035826445242821, "loss": 0.0721, "step": 52120 }, { "epoch": 1.31, "learning_rate": 0.0010354495892269428, "loss": 0.075, "step": 52130 }, { "epoch": 1.31, "learning_rate": 0.0010350727332110645, "loss": 0.0739, "step": 52140 }, { "epoch": 1.31, "learning_rate": 0.0010346958771951863, "loss": 0.071, "step": 52150 }, { "epoch": 1.31, "learning_rate": 0.0010343190211793082, "loss": 0.0702, "step": 52160 }, { "epoch": 1.31, "learning_rate": 0.00103394216516343, "loss": 0.0759, "step": 52170 }, { "epoch": 1.31, "learning_rate": 0.0010335653091475517, "loss": 0.0765, "step": 52180 }, { "epoch": 1.31, "learning_rate": 0.0010331884531316734, "loss": 0.0735, "step": 52190 }, { "epoch": 1.31, "learning_rate": 0.0010328115971157954, "loss": 0.0722, "step": 52200 }, { "epoch": 1.31, "learning_rate": 0.0010324347410999172, "loss": 0.0718, "step": 52210 }, { "epoch": 1.31, "learning_rate": 0.001032057885084039, "loss": 0.0712, "step": 52220 }, { "epoch": 1.31, "learning_rate": 0.0010316810290681606, "loss": 0.0741, "step": 52230 }, { "epoch": 1.31, "learning_rate": 0.0010313041730522826, "loss": 0.071, "step": 52240 }, { "epoch": 1.31, "learning_rate": 0.0010309273170364043, "loss": 0.0719, "step": 52250 }, { "epoch": 1.31, "learning_rate": 0.001030550461020526, "loss": 0.07, "step": 52260 }, { "epoch": 1.31, "learning_rate": 0.0010301736050046478, "loss": 0.0736, "step": 52270 }, { "epoch": 1.31, "learning_rate": 0.0010297967489887698, "loss": 0.0734, "step": 52280 }, { "epoch": 1.31, "learning_rate": 0.0010294198929728915, "loss": 0.0736, "step": 52290 }, { "epoch": 1.31, "learning_rate": 0.0010290430369570133, "loss": 0.0706, "step": 52300 }, { "epoch": 1.31, "learning_rate": 0.001028666180941135, "loss": 0.0719, "step": 52310 }, { "epoch": 1.31, "learning_rate": 0.0010282893249252568, "loss": 0.0728, "step": 52320 }, { "epoch": 1.31, "learning_rate": 0.0010279124689093787, "loss": 0.0694, "step": 52330 }, { "epoch": 1.31, "learning_rate": 0.0010275356128935005, "loss": 0.0718, "step": 52340 }, { "epoch": 1.32, "learning_rate": 0.0010271587568776222, "loss": 0.0706, "step": 52350 }, { "epoch": 1.32, "learning_rate": 0.001026781900861744, "loss": 0.0725, "step": 52360 }, { "epoch": 1.32, "learning_rate": 0.001026405044845866, "loss": 0.072, "step": 52370 }, { "epoch": 1.32, "learning_rate": 0.0010260281888299877, "loss": 0.0752, "step": 52380 }, { "epoch": 1.32, "learning_rate": 0.0010256513328141096, "loss": 0.0722, "step": 52390 }, { "epoch": 1.32, "learning_rate": 0.0010252744767982312, "loss": 0.0748, "step": 52400 }, { "epoch": 1.32, "learning_rate": 0.0010248976207823531, "loss": 0.073, "step": 52410 }, { "epoch": 1.32, "learning_rate": 0.0010245207647664749, "loss": 0.07, "step": 52420 }, { "epoch": 1.32, "learning_rate": 0.0010241439087505968, "loss": 0.0692, "step": 52430 }, { "epoch": 1.32, "learning_rate": 0.0010237670527347186, "loss": 0.0743, "step": 52440 }, { "epoch": 1.32, "learning_rate": 0.0010233901967188403, "loss": 0.077, "step": 52450 }, { "epoch": 1.32, "learning_rate": 0.001023013340702962, "loss": 0.0756, "step": 52460 }, { "epoch": 1.32, "learning_rate": 0.001022636484687084, "loss": 0.073, "step": 52470 }, { "epoch": 1.32, "learning_rate": 0.0010222596286712058, "loss": 0.0715, "step": 52480 }, { "epoch": 1.32, "learning_rate": 0.0010218827726553275, "loss": 0.0715, "step": 52490 }, { "epoch": 1.32, "learning_rate": 0.0010215059166394493, "loss": 0.0703, "step": 52500 }, { "epoch": 1.32, "eval_cer": 0.6654621471438739, "eval_loss": 0.06106410175561905, "eval_runtime": 90.7505, "eval_samples_per_second": 110.181, "eval_steps_per_second": 6.887, "step": 52500 }, { "epoch": 1.32, "learning_rate": 0.001021129060623571, "loss": 0.0698, "step": 52510 }, { "epoch": 1.32, "learning_rate": 0.001020752204607693, "loss": 0.0719, "step": 52520 }, { "epoch": 1.32, "learning_rate": 0.0010203753485918147, "loss": 0.073, "step": 52530 }, { "epoch": 1.32, "learning_rate": 0.0010199984925759365, "loss": 0.0707, "step": 52540 }, { "epoch": 1.32, "learning_rate": 0.0010196216365600582, "loss": 0.072, "step": 52550 }, { "epoch": 1.32, "learning_rate": 0.0010192447805441802, "loss": 0.0704, "step": 52560 }, { "epoch": 1.32, "learning_rate": 0.001018867924528302, "loss": 0.0717, "step": 52570 }, { "epoch": 1.32, "learning_rate": 0.0010184910685124237, "loss": 0.0709, "step": 52580 }, { "epoch": 1.32, "learning_rate": 0.0010181142124965454, "loss": 0.0738, "step": 52590 }, { "epoch": 1.32, "learning_rate": 0.0010177373564806674, "loss": 0.067, "step": 52600 }, { "epoch": 1.32, "learning_rate": 0.001017360500464789, "loss": 0.07, "step": 52610 }, { "epoch": 1.32, "learning_rate": 0.0010169836444489109, "loss": 0.072, "step": 52620 }, { "epoch": 1.32, "learning_rate": 0.0010166067884330326, "loss": 0.0748, "step": 52630 }, { "epoch": 1.32, "learning_rate": 0.0010162299324171546, "loss": 0.0709, "step": 52640 }, { "epoch": 1.32, "learning_rate": 0.0010158530764012763, "loss": 0.0732, "step": 52650 }, { "epoch": 1.32, "learning_rate": 0.0010154762203853983, "loss": 0.0708, "step": 52660 }, { "epoch": 1.32, "learning_rate": 0.0010150993643695198, "loss": 0.0752, "step": 52670 }, { "epoch": 1.32, "learning_rate": 0.0010147225083536418, "loss": 0.0717, "step": 52680 }, { "epoch": 1.32, "learning_rate": 0.0010143456523377635, "loss": 0.073, "step": 52690 }, { "epoch": 1.32, "learning_rate": 0.0010139687963218855, "loss": 0.071, "step": 52700 }, { "epoch": 1.32, "learning_rate": 0.0010135919403060072, "loss": 0.07, "step": 52710 }, { "epoch": 1.32, "learning_rate": 0.001013215084290129, "loss": 0.0735, "step": 52720 }, { "epoch": 1.32, "learning_rate": 0.0010128382282742507, "loss": 0.0759, "step": 52730 }, { "epoch": 1.33, "learning_rate": 0.0010124613722583724, "loss": 0.0733, "step": 52740 }, { "epoch": 1.33, "learning_rate": 0.0010120845162424944, "loss": 0.0738, "step": 52750 }, { "epoch": 1.33, "learning_rate": 0.001011707660226616, "loss": 0.071, "step": 52760 }, { "epoch": 1.33, "learning_rate": 0.0010113308042107379, "loss": 0.0747, "step": 52770 }, { "epoch": 1.33, "learning_rate": 0.0010109539481948596, "loss": 0.075, "step": 52780 }, { "epoch": 1.33, "learning_rate": 0.0010105770921789816, "loss": 0.0727, "step": 52790 }, { "epoch": 1.33, "learning_rate": 0.0010102002361631033, "loss": 0.0747, "step": 52800 }, { "epoch": 1.33, "learning_rate": 0.001009823380147225, "loss": 0.0732, "step": 52810 }, { "epoch": 1.33, "learning_rate": 0.0010094465241313468, "loss": 0.0699, "step": 52820 }, { "epoch": 1.33, "learning_rate": 0.0010090696681154688, "loss": 0.0717, "step": 52830 }, { "epoch": 1.33, "learning_rate": 0.0010086928120995905, "loss": 0.0679, "step": 52840 }, { "epoch": 1.33, "learning_rate": 0.0010083159560837123, "loss": 0.0713, "step": 52850 }, { "epoch": 1.33, "learning_rate": 0.001007939100067834, "loss": 0.0747, "step": 52860 }, { "epoch": 1.33, "learning_rate": 0.001007562244051956, "loss": 0.073, "step": 52870 }, { "epoch": 1.33, "learning_rate": 0.0010071853880360777, "loss": 0.074, "step": 52880 }, { "epoch": 1.33, "learning_rate": 0.0010068085320201995, "loss": 0.0758, "step": 52890 }, { "epoch": 1.33, "learning_rate": 0.0010064316760043212, "loss": 0.0721, "step": 52900 }, { "epoch": 1.33, "learning_rate": 0.0010060548199884432, "loss": 0.0704, "step": 52910 }, { "epoch": 1.33, "learning_rate": 0.001005677963972565, "loss": 0.074, "step": 52920 }, { "epoch": 1.33, "learning_rate": 0.0010053011079566867, "loss": 0.0716, "step": 52930 }, { "epoch": 1.33, "learning_rate": 0.0010049242519408084, "loss": 0.0735, "step": 52940 }, { "epoch": 1.33, "learning_rate": 0.0010045473959249304, "loss": 0.0705, "step": 52950 }, { "epoch": 1.33, "learning_rate": 0.0010041705399090521, "loss": 0.0727, "step": 52960 }, { "epoch": 1.33, "learning_rate": 0.0010037936838931739, "loss": 0.0741, "step": 52970 }, { "epoch": 1.33, "learning_rate": 0.0010034168278772956, "loss": 0.0699, "step": 52980 }, { "epoch": 1.33, "learning_rate": 0.0010030399718614174, "loss": 0.071, "step": 52990 }, { "epoch": 1.33, "learning_rate": 0.0010026631158455393, "loss": 0.0718, "step": 53000 }, { "epoch": 1.33, "eval_cer": 0.6655482873734304, "eval_loss": 0.06082231178879738, "eval_runtime": 90.7973, "eval_samples_per_second": 110.124, "eval_steps_per_second": 6.883, "step": 53000 }, { "epoch": 1.33, "learning_rate": 0.001002286259829661, "loss": 0.072, "step": 53010 }, { "epoch": 1.33, "learning_rate": 0.001001909403813783, "loss": 0.0687, "step": 53020 }, { "epoch": 1.33, "learning_rate": 0.0010015325477979046, "loss": 0.0701, "step": 53030 }, { "epoch": 1.33, "learning_rate": 0.0010011556917820265, "loss": 0.072, "step": 53040 }, { "epoch": 1.33, "learning_rate": 0.0010007788357661483, "loss": 0.0746, "step": 53050 }, { "epoch": 1.33, "learning_rate": 0.0010004019797502702, "loss": 0.0726, "step": 53060 }, { "epoch": 1.33, "learning_rate": 0.001000025123734392, "loss": 0.0694, "step": 53070 }, { "epoch": 1.33, "learning_rate": 0.0009996482677185137, "loss": 0.0733, "step": 53080 }, { "epoch": 1.33, "learning_rate": 0.0009992714117026355, "loss": 0.0767, "step": 53090 }, { "epoch": 1.33, "learning_rate": 0.0009988945556867574, "loss": 0.0724, "step": 53100 }, { "epoch": 1.33, "learning_rate": 0.0009985176996708792, "loss": 0.0753, "step": 53110 }, { "epoch": 1.33, "learning_rate": 0.000998140843655001, "loss": 0.0718, "step": 53120 }, { "epoch": 1.33, "learning_rate": 0.0009977639876391226, "loss": 0.0731, "step": 53130 }, { "epoch": 1.34, "learning_rate": 0.0009973871316232446, "loss": 0.073, "step": 53140 }, { "epoch": 1.34, "learning_rate": 0.0009970102756073664, "loss": 0.0725, "step": 53150 }, { "epoch": 1.34, "learning_rate": 0.000996633419591488, "loss": 0.0702, "step": 53160 }, { "epoch": 1.34, "learning_rate": 0.0009962565635756098, "loss": 0.0718, "step": 53170 }, { "epoch": 1.34, "learning_rate": 0.0009958797075597316, "loss": 0.0698, "step": 53180 }, { "epoch": 1.34, "learning_rate": 0.0009955028515438535, "loss": 0.0738, "step": 53190 }, { "epoch": 1.34, "learning_rate": 0.0009951259955279753, "loss": 0.0708, "step": 53200 }, { "epoch": 1.34, "learning_rate": 0.000994749139512097, "loss": 0.0719, "step": 53210 }, { "epoch": 1.34, "learning_rate": 0.0009943722834962188, "loss": 0.0705, "step": 53220 }, { "epoch": 1.34, "learning_rate": 0.0009939954274803407, "loss": 0.0735, "step": 53230 }, { "epoch": 1.34, "learning_rate": 0.0009936185714644625, "loss": 0.0689, "step": 53240 }, { "epoch": 1.34, "learning_rate": 0.0009932417154485842, "loss": 0.0734, "step": 53250 }, { "epoch": 1.34, "learning_rate": 0.000992864859432706, "loss": 0.0702, "step": 53260 }, { "epoch": 1.34, "learning_rate": 0.000992488003416828, "loss": 0.0728, "step": 53270 }, { "epoch": 1.34, "learning_rate": 0.0009921111474009497, "loss": 0.0755, "step": 53280 }, { "epoch": 1.34, "learning_rate": 0.0009917342913850716, "loss": 0.0705, "step": 53290 }, { "epoch": 1.34, "learning_rate": 0.0009913574353691932, "loss": 0.0708, "step": 53300 }, { "epoch": 1.34, "learning_rate": 0.0009909805793533151, "loss": 0.0678, "step": 53310 }, { "epoch": 1.34, "learning_rate": 0.0009906037233374369, "loss": 0.0701, "step": 53320 }, { "epoch": 1.34, "learning_rate": 0.0009902268673215588, "loss": 0.0708, "step": 53330 }, { "epoch": 1.34, "learning_rate": 0.0009898500113056804, "loss": 0.0682, "step": 53340 }, { "epoch": 1.34, "learning_rate": 0.0009894731552898023, "loss": 0.0692, "step": 53350 }, { "epoch": 1.34, "learning_rate": 0.000989096299273924, "loss": 0.0732, "step": 53360 }, { "epoch": 1.34, "learning_rate": 0.000988719443258046, "loss": 0.0717, "step": 53370 }, { "epoch": 1.34, "learning_rate": 0.0009883425872421678, "loss": 0.0711, "step": 53380 }, { "epoch": 1.34, "learning_rate": 0.0009879657312262895, "loss": 0.0732, "step": 53390 }, { "epoch": 1.34, "learning_rate": 0.0009875888752104113, "loss": 0.0734, "step": 53400 }, { "epoch": 1.34, "learning_rate": 0.000987212019194533, "loss": 0.0754, "step": 53410 }, { "epoch": 1.34, "learning_rate": 0.000986835163178655, "loss": 0.0732, "step": 53420 }, { "epoch": 1.34, "learning_rate": 0.0009864583071627767, "loss": 0.0717, "step": 53430 }, { "epoch": 1.34, "learning_rate": 0.0009860814511468985, "loss": 0.0724, "step": 53440 }, { "epoch": 1.34, "learning_rate": 0.0009857045951310202, "loss": 0.0711, "step": 53450 }, { "epoch": 1.34, "learning_rate": 0.0009853277391151422, "loss": 0.0715, "step": 53460 }, { "epoch": 1.34, "learning_rate": 0.000984950883099264, "loss": 0.07, "step": 53470 }, { "epoch": 1.34, "learning_rate": 0.0009845740270833857, "loss": 0.073, "step": 53480 }, { "epoch": 1.34, "learning_rate": 0.0009841971710675074, "loss": 0.0724, "step": 53490 }, { "epoch": 1.34, "learning_rate": 0.0009838203150516294, "loss": 0.0686, "step": 53500 }, { "epoch": 1.34, "eval_cer": 0.6653375084877, "eval_loss": 0.06101470813155174, "eval_runtime": 90.6137, "eval_samples_per_second": 110.348, "eval_steps_per_second": 6.897, "step": 53500 }, { "epoch": 1.34, "learning_rate": 0.0009834434590357511, "loss": 0.0681, "step": 53510 }, { "epoch": 1.34, "learning_rate": 0.0009830666030198729, "loss": 0.067, "step": 53520 }, { "epoch": 1.34, "learning_rate": 0.0009826897470039946, "loss": 0.0727, "step": 53530 }, { "epoch": 1.35, "learning_rate": 0.0009823128909881166, "loss": 0.0722, "step": 53540 }, { "epoch": 1.35, "learning_rate": 0.0009819360349722383, "loss": 0.0716, "step": 53550 }, { "epoch": 1.35, "learning_rate": 0.00098155917895636, "loss": 0.0718, "step": 53560 }, { "epoch": 1.35, "learning_rate": 0.0009811823229404818, "loss": 0.0726, "step": 53570 }, { "epoch": 1.35, "learning_rate": 0.0009808054669246038, "loss": 0.0677, "step": 53580 }, { "epoch": 1.35, "learning_rate": 0.0009804286109087255, "loss": 0.0702, "step": 53590 }, { "epoch": 1.35, "learning_rate": 0.0009800517548928475, "loss": 0.0701, "step": 53600 }, { "epoch": 1.35, "learning_rate": 0.000979674898876969, "loss": 0.072, "step": 53610 }, { "epoch": 1.35, "learning_rate": 0.0009792980428610907, "loss": 0.0723, "step": 53620 }, { "epoch": 1.35, "learning_rate": 0.0009789211868452127, "loss": 0.0696, "step": 53630 }, { "epoch": 1.35, "learning_rate": 0.0009785443308293344, "loss": 0.0715, "step": 53640 }, { "epoch": 1.35, "learning_rate": 0.0009781674748134564, "loss": 0.0733, "step": 53650 }, { "epoch": 1.35, "learning_rate": 0.000977790618797578, "loss": 0.0751, "step": 53660 }, { "epoch": 1.35, "learning_rate": 0.0009774137627817, "loss": 0.0722, "step": 53670 }, { "epoch": 1.35, "learning_rate": 0.0009770369067658216, "loss": 0.0675, "step": 53680 }, { "epoch": 1.35, "learning_rate": 0.0009766600507499436, "loss": 0.068, "step": 53690 }, { "epoch": 1.35, "learning_rate": 0.0009762831947340652, "loss": 0.0714, "step": 53700 }, { "epoch": 1.35, "learning_rate": 0.0009759063387181871, "loss": 0.0723, "step": 53710 }, { "epoch": 1.35, "learning_rate": 0.0009755294827023088, "loss": 0.073, "step": 53720 }, { "epoch": 1.35, "learning_rate": 0.0009751526266864307, "loss": 0.0702, "step": 53730 }, { "epoch": 1.35, "learning_rate": 0.0009747757706705524, "loss": 0.0757, "step": 53740 }, { "epoch": 1.35, "learning_rate": 0.0009743989146546744, "loss": 0.0702, "step": 53750 }, { "epoch": 1.35, "learning_rate": 0.000974022058638796, "loss": 0.0722, "step": 53760 }, { "epoch": 1.35, "learning_rate": 0.000973645202622918, "loss": 0.0747, "step": 53770 }, { "epoch": 1.35, "learning_rate": 0.0009732683466070396, "loss": 0.0731, "step": 53780 }, { "epoch": 1.35, "learning_rate": 0.0009728914905911616, "loss": 0.0745, "step": 53790 }, { "epoch": 1.35, "learning_rate": 0.0009725146345752832, "loss": 0.0717, "step": 53800 }, { "epoch": 1.35, "learning_rate": 0.0009721377785594052, "loss": 0.0748, "step": 53810 }, { "epoch": 1.35, "learning_rate": 0.0009717609225435269, "loss": 0.0734, "step": 53820 }, { "epoch": 1.35, "learning_rate": 0.0009713840665276488, "loss": 0.0734, "step": 53830 }, { "epoch": 1.35, "learning_rate": 0.0009710072105117705, "loss": 0.0695, "step": 53840 }, { "epoch": 1.35, "learning_rate": 0.0009706303544958922, "loss": 0.0715, "step": 53850 }, { "epoch": 1.35, "learning_rate": 0.0009702534984800141, "loss": 0.0708, "step": 53860 }, { "epoch": 1.35, "learning_rate": 0.0009698766424641359, "loss": 0.07, "step": 53870 }, { "epoch": 1.35, "learning_rate": 0.0009694997864482577, "loss": 0.0709, "step": 53880 }, { "epoch": 1.35, "learning_rate": 0.0009691229304323795, "loss": 0.0742, "step": 53890 }, { "epoch": 1.35, "learning_rate": 0.0009687460744165013, "loss": 0.0708, "step": 53900 }, { "epoch": 1.35, "learning_rate": 0.0009683692184006231, "loss": 0.0711, "step": 53910 }, { "epoch": 1.35, "learning_rate": 0.0009679923623847449, "loss": 0.068, "step": 53920 }, { "epoch": 1.35, "learning_rate": 0.0009676155063688667, "loss": 0.0715, "step": 53930 }, { "epoch": 1.36, "learning_rate": 0.0009672386503529885, "loss": 0.073, "step": 53940 }, { "epoch": 1.36, "learning_rate": 0.0009668617943371103, "loss": 0.0709, "step": 53950 }, { "epoch": 1.36, "learning_rate": 0.0009664849383212321, "loss": 0.0699, "step": 53960 }, { "epoch": 1.36, "learning_rate": 0.0009661080823053539, "loss": 0.0715, "step": 53970 }, { "epoch": 1.36, "learning_rate": 0.0009657312262894757, "loss": 0.0722, "step": 53980 }, { "epoch": 1.36, "learning_rate": 0.0009653543702735975, "loss": 0.0668, "step": 53990 }, { "epoch": 1.36, "learning_rate": 0.0009649775142577193, "loss": 0.0688, "step": 54000 }, { "epoch": 1.36, "eval_cer": 0.6656522331252974, "eval_loss": 0.060397226363420486, "eval_runtime": 90.8096, "eval_samples_per_second": 110.11, "eval_steps_per_second": 6.883, "step": 54000 }, { "epoch": 1.36, "learning_rate": 0.000964600658241841, "loss": 0.0686, "step": 54010 }, { "epoch": 1.36, "learning_rate": 0.0009642238022259629, "loss": 0.0727, "step": 54020 }, { "epoch": 1.36, "learning_rate": 0.0009638469462100847, "loss": 0.0683, "step": 54030 }, { "epoch": 1.36, "learning_rate": 0.0009634700901942066, "loss": 0.0678, "step": 54040 }, { "epoch": 1.36, "learning_rate": 0.0009630932341783282, "loss": 0.0718, "step": 54050 }, { "epoch": 1.36, "learning_rate": 0.0009627163781624502, "loss": 0.0727, "step": 54060 }, { "epoch": 1.36, "learning_rate": 0.0009623395221465718, "loss": 0.0712, "step": 54070 }, { "epoch": 1.36, "learning_rate": 0.0009619626661306936, "loss": 0.0725, "step": 54080 }, { "epoch": 1.36, "learning_rate": 0.0009615858101148154, "loss": 0.0715, "step": 54090 }, { "epoch": 1.36, "learning_rate": 0.0009612089540989372, "loss": 0.0701, "step": 54100 }, { "epoch": 1.36, "learning_rate": 0.0009608320980830591, "loss": 0.0725, "step": 54110 }, { "epoch": 1.36, "learning_rate": 0.0009604552420671808, "loss": 0.075, "step": 54120 }, { "epoch": 1.36, "learning_rate": 0.0009600783860513027, "loss": 0.0692, "step": 54130 }, { "epoch": 1.36, "learning_rate": 0.0009597015300354244, "loss": 0.0724, "step": 54140 }, { "epoch": 1.36, "learning_rate": 0.0009593246740195463, "loss": 0.067, "step": 54150 }, { "epoch": 1.36, "learning_rate": 0.0009589478180036681, "loss": 0.0737, "step": 54160 }, { "epoch": 1.36, "learning_rate": 0.0009585709619877899, "loss": 0.0668, "step": 54170 }, { "epoch": 1.36, "learning_rate": 0.0009581941059719117, "loss": 0.0715, "step": 54180 }, { "epoch": 1.36, "learning_rate": 0.0009578172499560335, "loss": 0.0717, "step": 54190 }, { "epoch": 1.36, "learning_rate": 0.0009574403939401553, "loss": 0.0748, "step": 54200 }, { "epoch": 1.36, "learning_rate": 0.0009570635379242771, "loss": 0.0702, "step": 54210 }, { "epoch": 1.36, "learning_rate": 0.0009566866819083989, "loss": 0.0734, "step": 54220 }, { "epoch": 1.36, "learning_rate": 0.0009563098258925207, "loss": 0.0703, "step": 54230 }, { "epoch": 1.36, "learning_rate": 0.0009559329698766425, "loss": 0.0712, "step": 54240 }, { "epoch": 1.36, "learning_rate": 0.0009555561138607643, "loss": 0.0733, "step": 54250 }, { "epoch": 1.36, "learning_rate": 0.0009551792578448861, "loss": 0.0693, "step": 54260 }, { "epoch": 1.36, "learning_rate": 0.0009548024018290079, "loss": 0.0699, "step": 54270 }, { "epoch": 1.36, "learning_rate": 0.0009544255458131297, "loss": 0.0729, "step": 54280 }, { "epoch": 1.36, "learning_rate": 0.0009540486897972514, "loss": 0.0699, "step": 54290 }, { "epoch": 1.36, "learning_rate": 0.0009536718337813733, "loss": 0.0693, "step": 54300 }, { "epoch": 1.36, "learning_rate": 0.000953294977765495, "loss": 0.0734, "step": 54310 }, { "epoch": 1.36, "learning_rate": 0.0009529181217496169, "loss": 0.0684, "step": 54320 }, { "epoch": 1.36, "learning_rate": 0.0009525412657337386, "loss": 0.0711, "step": 54330 }, { "epoch": 1.37, "learning_rate": 0.0009521644097178605, "loss": 0.0725, "step": 54340 }, { "epoch": 1.37, "learning_rate": 0.0009517875537019822, "loss": 0.074, "step": 54350 }, { "epoch": 1.37, "learning_rate": 0.0009514106976861041, "loss": 0.0689, "step": 54360 }, { "epoch": 1.37, "learning_rate": 0.0009510338416702258, "loss": 0.0725, "step": 54370 }, { "epoch": 1.37, "learning_rate": 0.0009506569856543477, "loss": 0.0691, "step": 54380 }, { "epoch": 1.37, "learning_rate": 0.0009502801296384694, "loss": 0.0711, "step": 54390 }, { "epoch": 1.37, "learning_rate": 0.0009499032736225914, "loss": 0.0654, "step": 54400 }, { "epoch": 1.37, "learning_rate": 0.000949526417606713, "loss": 0.0706, "step": 54410 }, { "epoch": 1.37, "learning_rate": 0.000949149561590835, "loss": 0.0704, "step": 54420 }, { "epoch": 1.37, "learning_rate": 0.0009487727055749566, "loss": 0.0744, "step": 54430 }, { "epoch": 1.37, "learning_rate": 0.0009483958495590786, "loss": 0.0717, "step": 54440 }, { "epoch": 1.37, "learning_rate": 0.0009480189935432003, "loss": 0.0697, "step": 54450 }, { "epoch": 1.37, "learning_rate": 0.0009476421375273222, "loss": 0.0716, "step": 54460 }, { "epoch": 1.37, "learning_rate": 0.0009472652815114439, "loss": 0.069, "step": 54470 }, { "epoch": 1.37, "learning_rate": 0.0009468884254955658, "loss": 0.0711, "step": 54480 }, { "epoch": 1.37, "learning_rate": 0.0009465115694796875, "loss": 0.0708, "step": 54490 }, { "epoch": 1.37, "learning_rate": 0.0009461347134638094, "loss": 0.0694, "step": 54500 }, { "epoch": 1.37, "eval_cer": 0.6656171033110091, "eval_loss": 0.06041229888796806, "eval_runtime": 90.7001, "eval_samples_per_second": 110.242, "eval_steps_per_second": 6.891, "step": 54500 }, { "epoch": 1.37, "learning_rate": 0.0009457578574479311, "loss": 0.0685, "step": 54510 }, { "epoch": 1.37, "learning_rate": 0.0009453810014320528, "loss": 0.071, "step": 54520 }, { "epoch": 1.37, "learning_rate": 0.0009450041454161747, "loss": 0.0692, "step": 54530 }, { "epoch": 1.37, "learning_rate": 0.0009446272894002964, "loss": 0.0709, "step": 54540 }, { "epoch": 1.37, "learning_rate": 0.0009442504333844183, "loss": 0.077, "step": 54550 }, { "epoch": 1.37, "learning_rate": 0.00094387357736854, "loss": 0.0719, "step": 54560 }, { "epoch": 1.37, "learning_rate": 0.0009434967213526619, "loss": 0.0736, "step": 54570 }, { "epoch": 1.37, "learning_rate": 0.0009431198653367836, "loss": 0.0701, "step": 54580 }, { "epoch": 1.37, "learning_rate": 0.0009427430093209055, "loss": 0.0678, "step": 54590 }, { "epoch": 1.37, "learning_rate": 0.0009423661533050272, "loss": 0.072, "step": 54600 }, { "epoch": 1.37, "learning_rate": 0.0009419892972891491, "loss": 0.0728, "step": 54610 }, { "epoch": 1.37, "learning_rate": 0.0009416124412732708, "loss": 0.0688, "step": 54620 }, { "epoch": 1.37, "learning_rate": 0.0009412355852573927, "loss": 0.0728, "step": 54630 }, { "epoch": 1.37, "learning_rate": 0.0009408587292415144, "loss": 0.0724, "step": 54640 }, { "epoch": 1.37, "learning_rate": 0.0009404818732256363, "loss": 0.0699, "step": 54650 }, { "epoch": 1.37, "learning_rate": 0.000940105017209758, "loss": 0.0712, "step": 54660 }, { "epoch": 1.37, "learning_rate": 0.0009397281611938799, "loss": 0.0722, "step": 54670 }, { "epoch": 1.37, "learning_rate": 0.0009393513051780016, "loss": 0.0721, "step": 54680 }, { "epoch": 1.37, "learning_rate": 0.0009389744491621236, "loss": 0.0688, "step": 54690 }, { "epoch": 1.37, "learning_rate": 0.0009385975931462452, "loss": 0.0696, "step": 54700 }, { "epoch": 1.37, "learning_rate": 0.0009382207371303672, "loss": 0.0704, "step": 54710 }, { "epoch": 1.37, "learning_rate": 0.0009378438811144888, "loss": 0.0704, "step": 54720 }, { "epoch": 1.38, "learning_rate": 0.0009374670250986108, "loss": 0.0748, "step": 54730 }, { "epoch": 1.38, "learning_rate": 0.0009370901690827325, "loss": 0.067, "step": 54740 }, { "epoch": 1.38, "learning_rate": 0.0009367133130668542, "loss": 0.0719, "step": 54750 }, { "epoch": 1.38, "learning_rate": 0.0009363364570509761, "loss": 0.0705, "step": 54760 }, { "epoch": 1.38, "learning_rate": 0.0009359596010350978, "loss": 0.0705, "step": 54770 }, { "epoch": 1.38, "learning_rate": 0.0009355827450192197, "loss": 0.0705, "step": 54780 }, { "epoch": 1.38, "learning_rate": 0.0009352058890033414, "loss": 0.0725, "step": 54790 }, { "epoch": 1.38, "learning_rate": 0.0009348290329874633, "loss": 0.0699, "step": 54800 }, { "epoch": 1.38, "learning_rate": 0.0009344521769715851, "loss": 0.0701, "step": 54810 }, { "epoch": 1.38, "learning_rate": 0.0009340753209557069, "loss": 0.0711, "step": 54820 }, { "epoch": 1.38, "learning_rate": 0.0009336984649398287, "loss": 0.0724, "step": 54830 }, { "epoch": 1.38, "learning_rate": 0.0009333216089239505, "loss": 0.0732, "step": 54840 }, { "epoch": 1.38, "learning_rate": 0.0009329447529080723, "loss": 0.0687, "step": 54850 }, { "epoch": 1.38, "learning_rate": 0.0009325678968921941, "loss": 0.0717, "step": 54860 }, { "epoch": 1.38, "learning_rate": 0.0009321910408763159, "loss": 0.0716, "step": 54870 }, { "epoch": 1.38, "learning_rate": 0.0009318141848604377, "loss": 0.0712, "step": 54880 }, { "epoch": 1.38, "learning_rate": 0.0009314373288445595, "loss": 0.0679, "step": 54890 }, { "epoch": 1.38, "learning_rate": 0.0009310604728286813, "loss": 0.0662, "step": 54900 }, { "epoch": 1.38, "learning_rate": 0.0009306836168128031, "loss": 0.0686, "step": 54910 }, { "epoch": 1.38, "learning_rate": 0.0009303067607969249, "loss": 0.0679, "step": 54920 }, { "epoch": 1.38, "learning_rate": 0.0009299299047810467, "loss": 0.0724, "step": 54930 }, { "epoch": 1.38, "learning_rate": 0.0009295530487651685, "loss": 0.0689, "step": 54940 }, { "epoch": 1.38, "learning_rate": 0.0009291761927492903, "loss": 0.0714, "step": 54950 }, { "epoch": 1.38, "learning_rate": 0.000928799336733412, "loss": 0.0718, "step": 54960 }, { "epoch": 1.38, "learning_rate": 0.0009284224807175338, "loss": 0.0682, "step": 54970 }, { "epoch": 1.38, "learning_rate": 0.0009280456247016556, "loss": 0.0673, "step": 54980 }, { "epoch": 1.38, "learning_rate": 0.0009276687686857774, "loss": 0.0715, "step": 54990 }, { "epoch": 1.38, "learning_rate": 0.0009272919126698992, "loss": 0.0736, "step": 55000 }, { "epoch": 1.38, "eval_cer": 0.6655213384747982, "eval_loss": 0.059801023453474045, "eval_runtime": 90.8051, "eval_samples_per_second": 110.115, "eval_steps_per_second": 6.883, "step": 55000 }, { "epoch": 1.38, "learning_rate": 0.000926915056654021, "loss": 0.074, "step": 55010 }, { "epoch": 1.38, "learning_rate": 0.0009265382006381428, "loss": 0.0714, "step": 55020 }, { "epoch": 1.38, "learning_rate": 0.0009261613446222648, "loss": 0.0728, "step": 55030 }, { "epoch": 1.38, "learning_rate": 0.0009257844886063864, "loss": 0.0733, "step": 55040 }, { "epoch": 1.38, "learning_rate": 0.0009254076325905083, "loss": 0.0697, "step": 55050 }, { "epoch": 1.38, "learning_rate": 0.00092503077657463, "loss": 0.0711, "step": 55060 }, { "epoch": 1.38, "learning_rate": 0.000924653920558752, "loss": 0.0707, "step": 55070 }, { "epoch": 1.38, "learning_rate": 0.0009242770645428736, "loss": 0.0692, "step": 55080 }, { "epoch": 1.38, "learning_rate": 0.0009239002085269955, "loss": 0.071, "step": 55090 }, { "epoch": 1.38, "learning_rate": 0.0009235233525111173, "loss": 0.0689, "step": 55100 }, { "epoch": 1.38, "learning_rate": 0.0009231464964952391, "loss": 0.0699, "step": 55110 }, { "epoch": 1.38, "learning_rate": 0.0009227696404793609, "loss": 0.0722, "step": 55120 }, { "epoch": 1.39, "learning_rate": 0.0009223927844634827, "loss": 0.0718, "step": 55130 }, { "epoch": 1.39, "learning_rate": 0.0009220159284476045, "loss": 0.069, "step": 55140 }, { "epoch": 1.39, "learning_rate": 0.0009216390724317263, "loss": 0.0707, "step": 55150 }, { "epoch": 1.39, "learning_rate": 0.0009212622164158481, "loss": 0.0696, "step": 55160 }, { "epoch": 1.39, "learning_rate": 0.0009208853603999699, "loss": 0.0671, "step": 55170 }, { "epoch": 1.39, "learning_rate": 0.0009205085043840917, "loss": 0.0723, "step": 55180 }, { "epoch": 1.39, "learning_rate": 0.0009201316483682134, "loss": 0.0706, "step": 55190 }, { "epoch": 1.39, "learning_rate": 0.0009197547923523353, "loss": 0.0695, "step": 55200 }, { "epoch": 1.39, "learning_rate": 0.000919377936336457, "loss": 0.0707, "step": 55210 }, { "epoch": 1.39, "learning_rate": 0.0009190010803205789, "loss": 0.0723, "step": 55220 }, { "epoch": 1.39, "learning_rate": 0.0009186242243047006, "loss": 0.0666, "step": 55230 }, { "epoch": 1.39, "learning_rate": 0.0009182473682888225, "loss": 0.0687, "step": 55240 }, { "epoch": 1.39, "learning_rate": 0.0009178705122729442, "loss": 0.0699, "step": 55250 }, { "epoch": 1.39, "learning_rate": 0.0009174936562570661, "loss": 0.0686, "step": 55260 }, { "epoch": 1.39, "learning_rate": 0.0009171168002411878, "loss": 0.0704, "step": 55270 }, { "epoch": 1.39, "learning_rate": 0.0009167399442253097, "loss": 0.0706, "step": 55280 }, { "epoch": 1.39, "learning_rate": 0.0009163630882094314, "loss": 0.0693, "step": 55290 }, { "epoch": 1.39, "learning_rate": 0.0009159862321935533, "loss": 0.0702, "step": 55300 }, { "epoch": 1.39, "learning_rate": 0.000915609376177675, "loss": 0.0685, "step": 55310 }, { "epoch": 1.39, "learning_rate": 0.000915232520161797, "loss": 0.0718, "step": 55320 }, { "epoch": 1.39, "learning_rate": 0.0009148556641459186, "loss": 0.0691, "step": 55330 }, { "epoch": 1.39, "learning_rate": 0.0009144788081300406, "loss": 0.0696, "step": 55340 }, { "epoch": 1.39, "learning_rate": 0.0009141019521141622, "loss": 0.0705, "step": 55350 }, { "epoch": 1.39, "learning_rate": 0.0009137250960982842, "loss": 0.0708, "step": 55360 }, { "epoch": 1.39, "learning_rate": 0.0009133482400824058, "loss": 0.0705, "step": 55370 }, { "epoch": 1.39, "learning_rate": 0.0009129713840665278, "loss": 0.0694, "step": 55380 }, { "epoch": 1.39, "learning_rate": 0.0009125945280506495, "loss": 0.0729, "step": 55390 }, { "epoch": 1.39, "learning_rate": 0.0009122176720347711, "loss": 0.0701, "step": 55400 }, { "epoch": 1.39, "learning_rate": 0.0009118408160188931, "loss": 0.0708, "step": 55410 }, { "epoch": 1.39, "learning_rate": 0.0009114639600030147, "loss": 0.0693, "step": 55420 }, { "epoch": 1.39, "learning_rate": 0.0009110871039871367, "loss": 0.0724, "step": 55430 }, { "epoch": 1.39, "learning_rate": 0.0009107102479712584, "loss": 0.072, "step": 55440 }, { "epoch": 1.39, "learning_rate": 0.0009103333919553803, "loss": 0.0703, "step": 55450 }, { "epoch": 1.39, "learning_rate": 0.000909956535939502, "loss": 0.0678, "step": 55460 }, { "epoch": 1.39, "learning_rate": 0.0009095796799236239, "loss": 0.0695, "step": 55470 }, { "epoch": 1.39, "learning_rate": 0.0009092028239077456, "loss": 0.0668, "step": 55480 }, { "epoch": 1.39, "learning_rate": 0.0009088259678918675, "loss": 0.0688, "step": 55490 }, { "epoch": 1.39, "learning_rate": 0.0009084491118759892, "loss": 0.0674, "step": 55500 }, { "epoch": 1.39, "eval_cer": 0.665315371892395, "eval_loss": 0.059912025928497314, "eval_runtime": 90.584, "eval_samples_per_second": 110.384, "eval_steps_per_second": 6.9, "step": 55500 }, { "epoch": 1.39, "learning_rate": 0.0009080722558601111, "loss": 0.0715, "step": 55510 }, { "epoch": 1.39, "learning_rate": 0.0009076953998442328, "loss": 0.0731, "step": 55520 }, { "epoch": 1.4, "learning_rate": 0.0009073185438283547, "loss": 0.0715, "step": 55530 }, { "epoch": 1.4, "learning_rate": 0.0009069416878124764, "loss": 0.07, "step": 55540 }, { "epoch": 1.4, "learning_rate": 0.0009065648317965983, "loss": 0.0687, "step": 55550 }, { "epoch": 1.4, "learning_rate": 0.00090618797578072, "loss": 0.0687, "step": 55560 }, { "epoch": 1.4, "learning_rate": 0.0009058111197648419, "loss": 0.0694, "step": 55570 }, { "epoch": 1.4, "learning_rate": 0.0009054342637489636, "loss": 0.0672, "step": 55580 }, { "epoch": 1.4, "learning_rate": 0.0009050574077330855, "loss": 0.0667, "step": 55590 }, { "epoch": 1.4, "learning_rate": 0.0009046805517172072, "loss": 0.072, "step": 55600 }, { "epoch": 1.4, "learning_rate": 0.0009043036957013292, "loss": 0.0723, "step": 55610 }, { "epoch": 1.4, "learning_rate": 0.0009039268396854508, "loss": 0.075, "step": 55620 }, { "epoch": 1.4, "learning_rate": 0.0009035499836695726, "loss": 0.069, "step": 55630 }, { "epoch": 1.4, "learning_rate": 0.0009031731276536944, "loss": 0.0707, "step": 55640 }, { "epoch": 1.4, "learning_rate": 0.0009027962716378162, "loss": 0.0713, "step": 55650 }, { "epoch": 1.4, "learning_rate": 0.0009024194156219381, "loss": 0.0738, "step": 55660 }, { "epoch": 1.4, "learning_rate": 0.0009020425596060598, "loss": 0.0692, "step": 55670 }, { "epoch": 1.4, "learning_rate": 0.0009016657035901817, "loss": 0.0703, "step": 55680 }, { "epoch": 1.4, "learning_rate": 0.0009012888475743034, "loss": 0.0706, "step": 55690 }, { "epoch": 1.4, "learning_rate": 0.0009009119915584253, "loss": 0.0711, "step": 55700 }, { "epoch": 1.4, "learning_rate": 0.000900535135542547, "loss": 0.0732, "step": 55710 }, { "epoch": 1.4, "learning_rate": 0.0009001582795266689, "loss": 0.0699, "step": 55720 }, { "epoch": 1.4, "learning_rate": 0.0008997814235107907, "loss": 0.0732, "step": 55730 }, { "epoch": 1.4, "learning_rate": 0.0008994045674949125, "loss": 0.0711, "step": 55740 }, { "epoch": 1.4, "learning_rate": 0.0008990277114790343, "loss": 0.069, "step": 55750 }, { "epoch": 1.4, "learning_rate": 0.0008986508554631561, "loss": 0.0747, "step": 55760 }, { "epoch": 1.4, "learning_rate": 0.0008982739994472779, "loss": 0.0718, "step": 55770 }, { "epoch": 1.4, "learning_rate": 0.0008978971434313997, "loss": 0.0675, "step": 55780 }, { "epoch": 1.4, "learning_rate": 0.0008975202874155215, "loss": 0.0723, "step": 55790 }, { "epoch": 1.4, "learning_rate": 0.0008971434313996433, "loss": 0.0714, "step": 55800 }, { "epoch": 1.4, "learning_rate": 0.0008967665753837651, "loss": 0.0693, "step": 55810 }, { "epoch": 1.4, "learning_rate": 0.0008963897193678869, "loss": 0.069, "step": 55820 }, { "epoch": 1.4, "learning_rate": 0.0008960128633520087, "loss": 0.0718, "step": 55830 }, { "epoch": 1.4, "learning_rate": 0.0008956360073361305, "loss": 0.0678, "step": 55840 }, { "epoch": 1.4, "learning_rate": 0.0008952591513202523, "loss": 0.0672, "step": 55850 }, { "epoch": 1.4, "learning_rate": 0.000894882295304374, "loss": 0.0708, "step": 55860 }, { "epoch": 1.4, "learning_rate": 0.0008945054392884959, "loss": 0.0695, "step": 55870 }, { "epoch": 1.4, "learning_rate": 0.0008941285832726176, "loss": 0.0705, "step": 55880 }, { "epoch": 1.4, "learning_rate": 0.0008937517272567395, "loss": 0.0687, "step": 55890 }, { "epoch": 1.4, "learning_rate": 0.0008933748712408612, "loss": 0.0712, "step": 55900 }, { "epoch": 1.4, "learning_rate": 0.000892998015224983, "loss": 0.0717, "step": 55910 }, { "epoch": 1.4, "learning_rate": 0.0008926211592091048, "loss": 0.0693, "step": 55920 }, { "epoch": 1.41, "learning_rate": 0.0008922443031932266, "loss": 0.069, "step": 55930 }, { "epoch": 1.41, "learning_rate": 0.0008918674471773484, "loss": 0.0694, "step": 55940 }, { "epoch": 1.41, "learning_rate": 0.0008914905911614704, "loss": 0.0716, "step": 55950 }, { "epoch": 1.41, "learning_rate": 0.000891113735145592, "loss": 0.0703, "step": 55960 }, { "epoch": 1.41, "learning_rate": 0.000890736879129714, "loss": 0.0703, "step": 55970 }, { "epoch": 1.41, "learning_rate": 0.0008903600231138356, "loss": 0.0733, "step": 55980 }, { "epoch": 1.41, "learning_rate": 0.0008899831670979575, "loss": 0.0722, "step": 55990 }, { "epoch": 1.41, "learning_rate": 0.0008896063110820792, "loss": 0.0681, "step": 56000 }, { "epoch": 1.41, "eval_cer": 0.6655227821657964, "eval_loss": 0.059231605380773544, "eval_runtime": 90.4542, "eval_samples_per_second": 110.542, "eval_steps_per_second": 6.91, "step": 56000 }, { "epoch": 1.41, "learning_rate": 0.0008892294550662011, "loss": 0.0705, "step": 56010 }, { "epoch": 1.41, "learning_rate": 0.0008888525990503229, "loss": 0.0708, "step": 56020 }, { "epoch": 1.41, "learning_rate": 0.0008884757430344447, "loss": 0.0687, "step": 56030 }, { "epoch": 1.41, "learning_rate": 0.0008880988870185665, "loss": 0.0679, "step": 56040 }, { "epoch": 1.41, "learning_rate": 0.0008877220310026883, "loss": 0.0681, "step": 56050 }, { "epoch": 1.41, "learning_rate": 0.0008873451749868101, "loss": 0.0703, "step": 56060 }, { "epoch": 1.41, "learning_rate": 0.0008869683189709317, "loss": 0.0706, "step": 56070 }, { "epoch": 1.41, "learning_rate": 0.0008865914629550537, "loss": 0.0731, "step": 56080 }, { "epoch": 1.41, "learning_rate": 0.0008862146069391754, "loss": 0.0723, "step": 56090 }, { "epoch": 1.41, "learning_rate": 0.0008858377509232973, "loss": 0.0696, "step": 56100 }, { "epoch": 1.41, "learning_rate": 0.000885460894907419, "loss": 0.0691, "step": 56110 }, { "epoch": 1.41, "learning_rate": 0.0008850840388915409, "loss": 0.0697, "step": 56120 }, { "epoch": 1.41, "learning_rate": 0.0008847071828756626, "loss": 0.0686, "step": 56130 }, { "epoch": 1.41, "learning_rate": 0.0008843303268597845, "loss": 0.0689, "step": 56140 }, { "epoch": 1.41, "learning_rate": 0.0008839534708439062, "loss": 0.0694, "step": 56150 }, { "epoch": 1.41, "learning_rate": 0.0008835766148280281, "loss": 0.0686, "step": 56160 }, { "epoch": 1.41, "learning_rate": 0.0008831997588121498, "loss": 0.0716, "step": 56170 }, { "epoch": 1.41, "learning_rate": 0.0008828229027962717, "loss": 0.0738, "step": 56180 }, { "epoch": 1.41, "learning_rate": 0.0008824460467803934, "loss": 0.0708, "step": 56190 }, { "epoch": 1.41, "learning_rate": 0.0008820691907645153, "loss": 0.0705, "step": 56200 }, { "epoch": 1.41, "learning_rate": 0.000881692334748637, "loss": 0.0699, "step": 56210 }, { "epoch": 1.41, "learning_rate": 0.0008813154787327589, "loss": 0.0711, "step": 56220 }, { "epoch": 1.41, "learning_rate": 0.0008809386227168806, "loss": 0.0703, "step": 56230 }, { "epoch": 1.41, "learning_rate": 0.0008805617667010026, "loss": 0.0686, "step": 56240 }, { "epoch": 1.41, "learning_rate": 0.0008801849106851242, "loss": 0.0713, "step": 56250 }, { "epoch": 1.41, "learning_rate": 0.0008798080546692462, "loss": 0.0688, "step": 56260 }, { "epoch": 1.41, "learning_rate": 0.0008794311986533678, "loss": 0.0703, "step": 56270 }, { "epoch": 1.41, "learning_rate": 0.0008790543426374898, "loss": 0.0685, "step": 56280 }, { "epoch": 1.41, "learning_rate": 0.0008786774866216114, "loss": 0.0714, "step": 56290 }, { "epoch": 1.41, "learning_rate": 0.0008783006306057331, "loss": 0.0715, "step": 56300 }, { "epoch": 1.41, "learning_rate": 0.0008779237745898551, "loss": 0.0664, "step": 56310 }, { "epoch": 1.41, "learning_rate": 0.0008775469185739767, "loss": 0.0706, "step": 56320 }, { "epoch": 1.42, "learning_rate": 0.0008771700625580987, "loss": 0.0698, "step": 56330 }, { "epoch": 1.42, "learning_rate": 0.0008767932065422203, "loss": 0.0704, "step": 56340 }, { "epoch": 1.42, "learning_rate": 0.0008764163505263423, "loss": 0.0672, "step": 56350 }, { "epoch": 1.42, "learning_rate": 0.000876039494510464, "loss": 0.0731, "step": 56360 }, { "epoch": 1.42, "learning_rate": 0.0008756626384945859, "loss": 0.0681, "step": 56370 }, { "epoch": 1.42, "learning_rate": 0.0008752857824787076, "loss": 0.0683, "step": 56380 }, { "epoch": 1.42, "learning_rate": 0.0008749089264628295, "loss": 0.0711, "step": 56390 }, { "epoch": 1.42, "learning_rate": 0.0008745320704469512, "loss": 0.0711, "step": 56400 }, { "epoch": 1.42, "learning_rate": 0.0008741552144310731, "loss": 0.0723, "step": 56410 }, { "epoch": 1.42, "learning_rate": 0.0008737783584151948, "loss": 0.0676, "step": 56420 }, { "epoch": 1.42, "learning_rate": 0.0008734015023993167, "loss": 0.0705, "step": 56430 }, { "epoch": 1.42, "learning_rate": 0.0008730246463834384, "loss": 0.0724, "step": 56440 }, { "epoch": 1.42, "learning_rate": 0.0008726477903675603, "loss": 0.0676, "step": 56450 }, { "epoch": 1.42, "learning_rate": 0.000872270934351682, "loss": 0.0701, "step": 56460 }, { "epoch": 1.42, "learning_rate": 0.0008718940783358039, "loss": 0.0708, "step": 56470 }, { "epoch": 1.42, "learning_rate": 0.0008715172223199256, "loss": 0.0662, "step": 56480 }, { "epoch": 1.42, "learning_rate": 0.0008711403663040475, "loss": 0.0735, "step": 56490 }, { "epoch": 1.42, "learning_rate": 0.0008707635102881692, "loss": 0.07, "step": 56500 }, { "epoch": 1.42, "eval_cer": 0.6653206654260548, "eval_loss": 0.05919070169329643, "eval_runtime": 90.4988, "eval_samples_per_second": 110.488, "eval_steps_per_second": 6.906, "step": 56500 }, { "epoch": 1.42, "learning_rate": 0.0008703866542722911, "loss": 0.071, "step": 56510 }, { "epoch": 1.42, "learning_rate": 0.0008700097982564128, "loss": 0.0711, "step": 56520 }, { "epoch": 1.42, "learning_rate": 0.0008696329422405346, "loss": 0.0723, "step": 56530 }, { "epoch": 1.42, "learning_rate": 0.0008692560862246564, "loss": 0.0702, "step": 56540 }, { "epoch": 1.42, "learning_rate": 0.0008688792302087782, "loss": 0.0691, "step": 56550 }, { "epoch": 1.42, "learning_rate": 0.0008685023741929, "loss": 0.0707, "step": 56560 }, { "epoch": 1.42, "learning_rate": 0.0008681255181770218, "loss": 0.0702, "step": 56570 }, { "epoch": 1.42, "learning_rate": 0.0008677486621611436, "loss": 0.072, "step": 56580 }, { "epoch": 1.42, "learning_rate": 0.0008673718061452654, "loss": 0.0715, "step": 56590 }, { "epoch": 1.42, "learning_rate": 0.0008669949501293873, "loss": 0.0694, "step": 56600 }, { "epoch": 1.42, "learning_rate": 0.000866618094113509, "loss": 0.0682, "step": 56610 }, { "epoch": 1.42, "learning_rate": 0.0008662412380976309, "loss": 0.0685, "step": 56620 }, { "epoch": 1.42, "learning_rate": 0.0008658643820817526, "loss": 0.068, "step": 56630 }, { "epoch": 1.42, "learning_rate": 0.0008654875260658745, "loss": 0.066, "step": 56640 }, { "epoch": 1.42, "learning_rate": 0.0008651106700499963, "loss": 0.0713, "step": 56650 }, { "epoch": 1.42, "learning_rate": 0.0008647338140341181, "loss": 0.0654, "step": 56660 }, { "epoch": 1.42, "learning_rate": 0.0008643569580182399, "loss": 0.0682, "step": 56670 }, { "epoch": 1.42, "learning_rate": 0.0008639801020023617, "loss": 0.0673, "step": 56680 }, { "epoch": 1.42, "learning_rate": 0.0008636032459864835, "loss": 0.0668, "step": 56690 }, { "epoch": 1.42, "learning_rate": 0.0008632263899706053, "loss": 0.0708, "step": 56700 }, { "epoch": 1.42, "learning_rate": 0.0008628495339547271, "loss": 0.0666, "step": 56710 }, { "epoch": 1.42, "learning_rate": 0.0008624726779388489, "loss": 0.0719, "step": 56720 }, { "epoch": 1.43, "learning_rate": 0.0008620958219229707, "loss": 0.0704, "step": 56730 }, { "epoch": 1.43, "learning_rate": 0.0008617189659070924, "loss": 0.0675, "step": 56740 }, { "epoch": 1.43, "learning_rate": 0.0008613421098912143, "loss": 0.0689, "step": 56750 }, { "epoch": 1.43, "learning_rate": 0.000860965253875336, "loss": 0.0683, "step": 56760 }, { "epoch": 1.43, "learning_rate": 0.0008605883978594579, "loss": 0.0668, "step": 56770 }, { "epoch": 1.43, "learning_rate": 0.0008602115418435796, "loss": 0.0726, "step": 56780 }, { "epoch": 1.43, "learning_rate": 0.0008598346858277015, "loss": 0.0677, "step": 56790 }, { "epoch": 1.43, "learning_rate": 0.0008594578298118232, "loss": 0.0704, "step": 56800 }, { "epoch": 1.43, "learning_rate": 0.000859080973795945, "loss": 0.0705, "step": 56810 }, { "epoch": 1.43, "learning_rate": 0.0008587041177800668, "loss": 0.0696, "step": 56820 }, { "epoch": 1.43, "learning_rate": 0.0008583272617641887, "loss": 0.07, "step": 56830 }, { "epoch": 1.43, "learning_rate": 0.0008579504057483104, "loss": 0.0723, "step": 56840 }, { "epoch": 1.43, "learning_rate": 0.0008575735497324322, "loss": 0.0681, "step": 56850 }, { "epoch": 1.43, "learning_rate": 0.000857196693716554, "loss": 0.0662, "step": 56860 }, { "epoch": 1.43, "learning_rate": 0.0008568198377006758, "loss": 0.0682, "step": 56870 }, { "epoch": 1.43, "learning_rate": 0.0008564429816847976, "loss": 0.0712, "step": 56880 }, { "epoch": 1.43, "learning_rate": 0.0008560661256689196, "loss": 0.0707, "step": 56890 }, { "epoch": 1.43, "learning_rate": 0.0008556892696530412, "loss": 0.0727, "step": 56900 }, { "epoch": 1.43, "learning_rate": 0.0008553124136371631, "loss": 0.0705, "step": 56910 }, { "epoch": 1.43, "learning_rate": 0.0008549355576212848, "loss": 0.068, "step": 56920 }, { "epoch": 1.43, "learning_rate": 0.0008545587016054067, "loss": 0.0701, "step": 56930 }, { "epoch": 1.43, "learning_rate": 0.0008541818455895285, "loss": 0.0712, "step": 56940 }, { "epoch": 1.43, "learning_rate": 0.0008538049895736503, "loss": 0.0691, "step": 56950 }, { "epoch": 1.43, "learning_rate": 0.0008534281335577721, "loss": 0.0715, "step": 56960 }, { "epoch": 1.43, "learning_rate": 0.0008530512775418937, "loss": 0.0693, "step": 56970 }, { "epoch": 1.43, "learning_rate": 0.0008526744215260157, "loss": 0.0713, "step": 56980 }, { "epoch": 1.43, "learning_rate": 0.0008522975655101373, "loss": 0.0708, "step": 56990 }, { "epoch": 1.43, "learning_rate": 0.0008519207094942593, "loss": 0.0704, "step": 57000 }, { "epoch": 1.43, "eval_cer": 0.6655526184464249, "eval_loss": 0.05909842625260353, "eval_runtime": 90.4968, "eval_samples_per_second": 110.49, "eval_steps_per_second": 6.906, "step": 57000 }, { "epoch": 1.43, "learning_rate": 0.000851543853478381, "loss": 0.0703, "step": 57010 }, { "epoch": 1.43, "learning_rate": 0.0008511669974625029, "loss": 0.0675, "step": 57020 }, { "epoch": 1.43, "learning_rate": 0.0008507901414466246, "loss": 0.0671, "step": 57030 }, { "epoch": 1.43, "learning_rate": 0.0008504132854307465, "loss": 0.0711, "step": 57040 }, { "epoch": 1.43, "learning_rate": 0.0008500364294148682, "loss": 0.0675, "step": 57050 }, { "epoch": 1.43, "learning_rate": 0.0008496595733989901, "loss": 0.0713, "step": 57060 }, { "epoch": 1.43, "learning_rate": 0.0008492827173831118, "loss": 0.0689, "step": 57070 }, { "epoch": 1.43, "learning_rate": 0.0008489058613672337, "loss": 0.0674, "step": 57080 }, { "epoch": 1.43, "learning_rate": 0.0008485290053513554, "loss": 0.0687, "step": 57090 }, { "epoch": 1.43, "learning_rate": 0.0008481521493354773, "loss": 0.0704, "step": 57100 }, { "epoch": 1.43, "learning_rate": 0.000847775293319599, "loss": 0.0711, "step": 57110 }, { "epoch": 1.44, "learning_rate": 0.0008473984373037209, "loss": 0.0692, "step": 57120 }, { "epoch": 1.44, "learning_rate": 0.0008470215812878426, "loss": 0.0673, "step": 57130 }, { "epoch": 1.44, "learning_rate": 0.0008466447252719645, "loss": 0.0716, "step": 57140 }, { "epoch": 1.44, "learning_rate": 0.0008462678692560862, "loss": 0.0707, "step": 57150 }, { "epoch": 1.44, "learning_rate": 0.0008458910132402081, "loss": 0.0698, "step": 57160 }, { "epoch": 1.44, "learning_rate": 0.0008455141572243298, "loss": 0.069, "step": 57170 }, { "epoch": 1.44, "learning_rate": 0.0008451373012084516, "loss": 0.0683, "step": 57180 }, { "epoch": 1.44, "learning_rate": 0.0008447604451925734, "loss": 0.0663, "step": 57190 }, { "epoch": 1.44, "learning_rate": 0.0008443835891766952, "loss": 0.0678, "step": 57200 }, { "epoch": 1.44, "learning_rate": 0.000844006733160817, "loss": 0.0642, "step": 57210 }, { "epoch": 1.44, "learning_rate": 0.0008436298771449388, "loss": 0.068, "step": 57220 }, { "epoch": 1.44, "learning_rate": 0.0008432530211290607, "loss": 0.0674, "step": 57230 }, { "epoch": 1.44, "learning_rate": 0.0008428761651131823, "loss": 0.0709, "step": 57240 }, { "epoch": 1.44, "learning_rate": 0.0008424993090973043, "loss": 0.071, "step": 57250 }, { "epoch": 1.44, "learning_rate": 0.000842122453081426, "loss": 0.0688, "step": 57260 }, { "epoch": 1.44, "learning_rate": 0.0008417455970655479, "loss": 0.0658, "step": 57270 }, { "epoch": 1.44, "learning_rate": 0.0008413687410496695, "loss": 0.0731, "step": 57280 }, { "epoch": 1.44, "learning_rate": 0.0008409918850337915, "loss": 0.0689, "step": 57290 }, { "epoch": 1.44, "learning_rate": 0.0008406150290179132, "loss": 0.0702, "step": 57300 }, { "epoch": 1.44, "learning_rate": 0.0008402381730020351, "loss": 0.0701, "step": 57310 }, { "epoch": 1.44, "learning_rate": 0.0008398613169861568, "loss": 0.0686, "step": 57320 }, { "epoch": 1.44, "learning_rate": 0.0008394844609702787, "loss": 0.0696, "step": 57330 }, { "epoch": 1.44, "learning_rate": 0.0008391076049544004, "loss": 0.071, "step": 57340 }, { "epoch": 1.44, "learning_rate": 0.0008387307489385223, "loss": 0.0677, "step": 57350 }, { "epoch": 1.44, "learning_rate": 0.000838353892922644, "loss": 0.0688, "step": 57360 }, { "epoch": 1.44, "learning_rate": 0.0008379770369067659, "loss": 0.0669, "step": 57370 }, { "epoch": 1.44, "learning_rate": 0.0008376001808908876, "loss": 0.0696, "step": 57380 }, { "epoch": 1.44, "learning_rate": 0.0008372233248750095, "loss": 0.0704, "step": 57390 }, { "epoch": 1.44, "learning_rate": 0.0008368464688591312, "loss": 0.0708, "step": 57400 }, { "epoch": 1.44, "learning_rate": 0.000836469612843253, "loss": 0.0712, "step": 57410 }, { "epoch": 1.44, "learning_rate": 0.0008360927568273748, "loss": 0.0688, "step": 57420 }, { "epoch": 1.44, "learning_rate": 0.0008357159008114966, "loss": 0.0688, "step": 57430 }, { "epoch": 1.44, "learning_rate": 0.0008353390447956184, "loss": 0.0703, "step": 57440 }, { "epoch": 1.44, "learning_rate": 0.0008349621887797402, "loss": 0.0675, "step": 57450 }, { "epoch": 1.44, "learning_rate": 0.000834585332763862, "loss": 0.0696, "step": 57460 }, { "epoch": 1.44, "learning_rate": 0.0008342084767479838, "loss": 0.0662, "step": 57470 }, { "epoch": 1.44, "learning_rate": 0.0008338316207321056, "loss": 0.0691, "step": 57480 }, { "epoch": 1.44, "learning_rate": 0.0008334547647162274, "loss": 0.071, "step": 57490 }, { "epoch": 1.44, "learning_rate": 0.0008330779087003492, "loss": 0.0719, "step": 57500 }, { "epoch": 1.44, "eval_cer": 0.6653355835663691, "eval_loss": 0.058829259127378464, "eval_runtime": 90.5112, "eval_samples_per_second": 110.473, "eval_steps_per_second": 6.905, "step": 57500 }, { "epoch": 1.44, "learning_rate": 0.000832701052684471, "loss": 0.0701, "step": 57510 }, { "epoch": 1.45, "learning_rate": 0.0008323241966685929, "loss": 0.0698, "step": 57520 }, { "epoch": 1.45, "learning_rate": 0.0008319473406527146, "loss": 0.0723, "step": 57530 }, { "epoch": 1.45, "learning_rate": 0.0008315704846368365, "loss": 0.0698, "step": 57540 }, { "epoch": 1.45, "learning_rate": 0.0008311936286209582, "loss": 0.0693, "step": 57550 }, { "epoch": 1.45, "learning_rate": 0.0008308167726050801, "loss": 0.0703, "step": 57560 }, { "epoch": 1.45, "learning_rate": 0.0008304399165892018, "loss": 0.0689, "step": 57570 }, { "epoch": 1.45, "learning_rate": 0.0008300630605733237, "loss": 0.0676, "step": 57580 }, { "epoch": 1.45, "learning_rate": 0.0008296862045574455, "loss": 0.0668, "step": 57590 }, { "epoch": 1.45, "learning_rate": 0.0008293093485415673, "loss": 0.0671, "step": 57600 }, { "epoch": 1.45, "learning_rate": 0.0008289324925256891, "loss": 0.0717, "step": 57610 }, { "epoch": 1.45, "learning_rate": 0.0008285556365098109, "loss": 0.0691, "step": 57620 }, { "epoch": 1.45, "learning_rate": 0.0008281787804939327, "loss": 0.0706, "step": 57630 }, { "epoch": 1.45, "learning_rate": 0.0008278019244780544, "loss": 0.0736, "step": 57640 }, { "epoch": 1.45, "learning_rate": 0.0008274250684621763, "loss": 0.0663, "step": 57650 }, { "epoch": 1.45, "learning_rate": 0.000827048212446298, "loss": 0.0708, "step": 57660 }, { "epoch": 1.45, "learning_rate": 0.0008266713564304199, "loss": 0.0745, "step": 57670 }, { "epoch": 1.45, "learning_rate": 0.0008262945004145416, "loss": 0.0712, "step": 57680 }, { "epoch": 1.45, "learning_rate": 0.0008259176443986635, "loss": 0.067, "step": 57690 }, { "epoch": 1.45, "learning_rate": 0.0008255407883827852, "loss": 0.0707, "step": 57700 }, { "epoch": 1.45, "learning_rate": 0.0008251639323669071, "loss": 0.0684, "step": 57710 }, { "epoch": 1.45, "learning_rate": 0.0008247870763510288, "loss": 0.07, "step": 57720 }, { "epoch": 1.45, "learning_rate": 0.0008244102203351507, "loss": 0.0695, "step": 57730 }, { "epoch": 1.45, "learning_rate": 0.0008240333643192724, "loss": 0.0666, "step": 57740 }, { "epoch": 1.45, "learning_rate": 0.0008236565083033943, "loss": 0.0733, "step": 57750 }, { "epoch": 1.45, "learning_rate": 0.000823279652287516, "loss": 0.0692, "step": 57760 }, { "epoch": 1.45, "learning_rate": 0.0008229027962716378, "loss": 0.0668, "step": 57770 }, { "epoch": 1.45, "learning_rate": 0.0008225259402557596, "loss": 0.0707, "step": 57780 }, { "epoch": 1.45, "learning_rate": 0.0008221490842398814, "loss": 0.0703, "step": 57790 }, { "epoch": 1.45, "learning_rate": 0.0008217722282240032, "loss": 0.0685, "step": 57800 }, { "epoch": 1.45, "learning_rate": 0.0008213953722081252, "loss": 0.0707, "step": 57810 }, { "epoch": 1.45, "learning_rate": 0.0008210185161922468, "loss": 0.0687, "step": 57820 }, { "epoch": 1.45, "learning_rate": 0.0008206416601763688, "loss": 0.0694, "step": 57830 }, { "epoch": 1.45, "learning_rate": 0.0008202648041604904, "loss": 0.0684, "step": 57840 }, { "epoch": 1.45, "learning_rate": 0.0008198879481446121, "loss": 0.0704, "step": 57850 }, { "epoch": 1.45, "learning_rate": 0.000819511092128734, "loss": 0.068, "step": 57860 }, { "epoch": 1.45, "learning_rate": 0.0008191342361128557, "loss": 0.0702, "step": 57870 }, { "epoch": 1.45, "learning_rate": 0.0008187573800969777, "loss": 0.0674, "step": 57880 }, { "epoch": 1.45, "learning_rate": 0.0008183805240810993, "loss": 0.0683, "step": 57890 }, { "epoch": 1.45, "learning_rate": 0.0008180036680652213, "loss": 0.0692, "step": 57900 }, { "epoch": 1.45, "learning_rate": 0.0008176268120493429, "loss": 0.0696, "step": 57910 }, { "epoch": 1.46, "learning_rate": 0.0008172499560334649, "loss": 0.0678, "step": 57920 }, { "epoch": 1.46, "learning_rate": 0.0008168731000175866, "loss": 0.0715, "step": 57930 }, { "epoch": 1.46, "learning_rate": 0.0008164962440017085, "loss": 0.0721, "step": 57940 }, { "epoch": 1.46, "learning_rate": 0.0008161193879858302, "loss": 0.0677, "step": 57950 }, { "epoch": 1.46, "learning_rate": 0.0008157425319699521, "loss": 0.0688, "step": 57960 }, { "epoch": 1.46, "learning_rate": 0.0008153656759540738, "loss": 0.0709, "step": 57970 }, { "epoch": 1.46, "learning_rate": 0.0008149888199381957, "loss": 0.0701, "step": 57980 }, { "epoch": 1.46, "learning_rate": 0.0008146119639223174, "loss": 0.0693, "step": 57990 }, { "epoch": 1.46, "learning_rate": 0.0008142351079064393, "loss": 0.0667, "step": 58000 }, { "epoch": 1.46, "eval_cer": 0.6652869793027646, "eval_loss": 0.058723725378513336, "eval_runtime": 90.5517, "eval_samples_per_second": 110.423, "eval_steps_per_second": 6.902, "step": 58000 }, { "epoch": 1.46, "learning_rate": 0.000813858251890561, "loss": 0.0663, "step": 58010 }, { "epoch": 1.46, "learning_rate": 0.0008134813958746829, "loss": 0.0664, "step": 58020 }, { "epoch": 1.46, "learning_rate": 0.0008131045398588046, "loss": 0.0718, "step": 58030 }, { "epoch": 1.46, "learning_rate": 0.0008127276838429265, "loss": 0.0731, "step": 58040 }, { "epoch": 1.46, "learning_rate": 0.0008123508278270482, "loss": 0.0666, "step": 58050 }, { "epoch": 1.46, "learning_rate": 0.0008119739718111701, "loss": 0.0696, "step": 58060 }, { "epoch": 1.46, "learning_rate": 0.0008115971157952918, "loss": 0.0671, "step": 58070 }, { "epoch": 1.46, "learning_rate": 0.0008112202597794136, "loss": 0.0664, "step": 58080 }, { "epoch": 1.46, "learning_rate": 0.0008108434037635354, "loss": 0.0686, "step": 58090 }, { "epoch": 1.46, "learning_rate": 0.0008104665477476572, "loss": 0.0685, "step": 58100 }, { "epoch": 1.46, "learning_rate": 0.000810089691731779, "loss": 0.071, "step": 58110 }, { "epoch": 1.46, "learning_rate": 0.0008097128357159008, "loss": 0.0643, "step": 58120 }, { "epoch": 1.46, "learning_rate": 0.0008093359797000226, "loss": 0.0684, "step": 58130 }, { "epoch": 1.46, "learning_rate": 0.0008089591236841444, "loss": 0.0697, "step": 58140 }, { "epoch": 1.46, "learning_rate": 0.0008085822676682662, "loss": 0.0708, "step": 58150 }, { "epoch": 1.46, "learning_rate": 0.000808205411652388, "loss": 0.0678, "step": 58160 }, { "epoch": 1.46, "learning_rate": 0.0008078285556365099, "loss": 0.0682, "step": 58170 }, { "epoch": 1.46, "learning_rate": 0.0008074516996206315, "loss": 0.0681, "step": 58180 }, { "epoch": 1.46, "learning_rate": 0.0008070748436047535, "loss": 0.0668, "step": 58190 }, { "epoch": 1.46, "learning_rate": 0.0008066979875888751, "loss": 0.07, "step": 58200 }, { "epoch": 1.46, "learning_rate": 0.0008063211315729971, "loss": 0.0689, "step": 58210 }, { "epoch": 1.46, "learning_rate": 0.0008059442755571189, "loss": 0.069, "step": 58220 }, { "epoch": 1.46, "learning_rate": 0.0008055674195412407, "loss": 0.0717, "step": 58230 }, { "epoch": 1.46, "learning_rate": 0.0008051905635253624, "loss": 0.0697, "step": 58240 }, { "epoch": 1.46, "learning_rate": 0.0008048137075094843, "loss": 0.0678, "step": 58250 }, { "epoch": 1.46, "learning_rate": 0.000804436851493606, "loss": 0.0652, "step": 58260 }, { "epoch": 1.46, "learning_rate": 0.0008040599954777279, "loss": 0.0689, "step": 58270 }, { "epoch": 1.46, "learning_rate": 0.0008036831394618496, "loss": 0.0715, "step": 58280 }, { "epoch": 1.46, "learning_rate": 0.0008033062834459715, "loss": 0.0672, "step": 58290 }, { "epoch": 1.46, "learning_rate": 0.0008029294274300932, "loss": 0.0701, "step": 58300 }, { "epoch": 1.46, "learning_rate": 0.000802552571414215, "loss": 0.0684, "step": 58310 }, { "epoch": 1.47, "learning_rate": 0.0008021757153983368, "loss": 0.0669, "step": 58320 }, { "epoch": 1.47, "learning_rate": 0.0008017988593824586, "loss": 0.0674, "step": 58330 }, { "epoch": 1.47, "learning_rate": 0.0008014220033665804, "loss": 0.0695, "step": 58340 }, { "epoch": 1.47, "learning_rate": 0.0008010451473507022, "loss": 0.066, "step": 58350 }, { "epoch": 1.47, "learning_rate": 0.000800668291334824, "loss": 0.0672, "step": 58360 }, { "epoch": 1.47, "learning_rate": 0.0008002914353189458, "loss": 0.0698, "step": 58370 }, { "epoch": 1.47, "learning_rate": 0.0007999145793030676, "loss": 0.0669, "step": 58380 }, { "epoch": 1.47, "learning_rate": 0.0007995377232871894, "loss": 0.0664, "step": 58390 }, { "epoch": 1.47, "learning_rate": 0.0007991608672713112, "loss": 0.0687, "step": 58400 }, { "epoch": 1.47, "learning_rate": 0.000798784011255433, "loss": 0.0633, "step": 58410 }, { "epoch": 1.47, "learning_rate": 0.0007984071552395548, "loss": 0.0722, "step": 58420 }, { "epoch": 1.47, "learning_rate": 0.0007980302992236766, "loss": 0.0679, "step": 58430 }, { "epoch": 1.47, "learning_rate": 0.0007976534432077984, "loss": 0.07, "step": 58440 }, { "epoch": 1.47, "learning_rate": 0.0007972765871919202, "loss": 0.0702, "step": 58450 }, { "epoch": 1.47, "learning_rate": 0.0007968997311760421, "loss": 0.0662, "step": 58460 }, { "epoch": 1.47, "learning_rate": 0.0007965228751601638, "loss": 0.0692, "step": 58470 }, { "epoch": 1.47, "learning_rate": 0.0007961460191442857, "loss": 0.0649, "step": 58480 }, { "epoch": 1.47, "learning_rate": 0.0007957691631284074, "loss": 0.0691, "step": 58490 }, { "epoch": 1.47, "learning_rate": 0.0007953923071125293, "loss": 0.0694, "step": 58500 }, { "epoch": 1.47, "eval_cer": 0.6653269214203802, "eval_loss": 0.05830288305878639, "eval_runtime": 90.732, "eval_samples_per_second": 110.204, "eval_steps_per_second": 6.888, "step": 58500 }, { "epoch": 1.47, "learning_rate": 0.0007950154510966511, "loss": 0.0678, "step": 58510 }, { "epoch": 1.47, "learning_rate": 0.0007946385950807727, "loss": 0.0685, "step": 58520 }, { "epoch": 1.47, "learning_rate": 0.0007942617390648947, "loss": 0.0665, "step": 58530 }, { "epoch": 1.47, "learning_rate": 0.0007938848830490163, "loss": 0.0687, "step": 58540 }, { "epoch": 1.47, "learning_rate": 0.0007935080270331383, "loss": 0.0717, "step": 58550 }, { "epoch": 1.47, "learning_rate": 0.0007931311710172599, "loss": 0.0654, "step": 58560 }, { "epoch": 1.47, "learning_rate": 0.0007927543150013819, "loss": 0.0671, "step": 58570 }, { "epoch": 1.47, "learning_rate": 0.0007923774589855036, "loss": 0.0703, "step": 58580 }, { "epoch": 1.47, "learning_rate": 0.0007920006029696255, "loss": 0.0691, "step": 58590 }, { "epoch": 1.47, "learning_rate": 0.0007916237469537472, "loss": 0.0692, "step": 58600 }, { "epoch": 1.47, "learning_rate": 0.0007912468909378691, "loss": 0.066, "step": 58610 }, { "epoch": 1.47, "learning_rate": 0.0007908700349219908, "loss": 0.0667, "step": 58620 }, { "epoch": 1.47, "learning_rate": 0.0007904931789061127, "loss": 0.0678, "step": 58630 }, { "epoch": 1.47, "learning_rate": 0.0007901163228902344, "loss": 0.0698, "step": 58640 }, { "epoch": 1.47, "learning_rate": 0.0007897394668743563, "loss": 0.0684, "step": 58650 }, { "epoch": 1.47, "learning_rate": 0.000789362610858478, "loss": 0.0677, "step": 58660 }, { "epoch": 1.47, "learning_rate": 0.0007889857548425999, "loss": 0.0695, "step": 58670 }, { "epoch": 1.47, "learning_rate": 0.0007886088988267216, "loss": 0.0644, "step": 58680 }, { "epoch": 1.47, "learning_rate": 0.0007882320428108435, "loss": 0.066, "step": 58690 }, { "epoch": 1.47, "learning_rate": 0.0007878551867949652, "loss": 0.068, "step": 58700 }, { "epoch": 1.47, "learning_rate": 0.000787478330779087, "loss": 0.0684, "step": 58710 }, { "epoch": 1.48, "learning_rate": 0.0007871014747632088, "loss": 0.0709, "step": 58720 }, { "epoch": 1.48, "learning_rate": 0.0007867246187473308, "loss": 0.0706, "step": 58730 }, { "epoch": 1.48, "learning_rate": 0.0007863477627314524, "loss": 0.0724, "step": 58740 }, { "epoch": 1.48, "learning_rate": 0.0007859709067155741, "loss": 0.0707, "step": 58750 }, { "epoch": 1.48, "learning_rate": 0.000785594050699696, "loss": 0.0661, "step": 58760 }, { "epoch": 1.48, "learning_rate": 0.0007852171946838177, "loss": 0.0663, "step": 58770 }, { "epoch": 1.48, "learning_rate": 0.0007848403386679396, "loss": 0.0678, "step": 58780 }, { "epoch": 1.48, "learning_rate": 0.0007844634826520613, "loss": 0.0678, "step": 58790 }, { "epoch": 1.48, "learning_rate": 0.0007840866266361833, "loss": 0.0676, "step": 58800 }, { "epoch": 1.48, "learning_rate": 0.0007837097706203049, "loss": 0.0677, "step": 58810 }, { "epoch": 1.48, "learning_rate": 0.0007833329146044269, "loss": 0.0691, "step": 58820 }, { "epoch": 1.48, "learning_rate": 0.0007829560585885485, "loss": 0.068, "step": 58830 }, { "epoch": 1.48, "learning_rate": 0.0007825792025726705, "loss": 0.0702, "step": 58840 }, { "epoch": 1.48, "learning_rate": 0.0007822023465567921, "loss": 0.0686, "step": 58850 }, { "epoch": 1.48, "learning_rate": 0.0007818254905409141, "loss": 0.0674, "step": 58860 }, { "epoch": 1.48, "learning_rate": 0.0007814486345250358, "loss": 0.0677, "step": 58870 }, { "epoch": 1.48, "learning_rate": 0.0007810717785091577, "loss": 0.0682, "step": 58880 }, { "epoch": 1.48, "learning_rate": 0.0007806949224932794, "loss": 0.0694, "step": 58890 }, { "epoch": 1.48, "learning_rate": 0.0007803180664774013, "loss": 0.0678, "step": 58900 }, { "epoch": 1.48, "learning_rate": 0.000779941210461523, "loss": 0.0662, "step": 58910 }, { "epoch": 1.48, "learning_rate": 0.0007795643544456449, "loss": 0.0691, "step": 58920 }, { "epoch": 1.48, "learning_rate": 0.0007791874984297666, "loss": 0.069, "step": 58930 }, { "epoch": 1.48, "learning_rate": 0.0007788106424138885, "loss": 0.0671, "step": 58940 }, { "epoch": 1.48, "learning_rate": 0.0007784337863980102, "loss": 0.0676, "step": 58950 }, { "epoch": 1.48, "learning_rate": 0.000778056930382132, "loss": 0.0716, "step": 58960 }, { "epoch": 1.48, "learning_rate": 0.0007776800743662538, "loss": 0.0661, "step": 58970 }, { "epoch": 1.48, "learning_rate": 0.0007773032183503756, "loss": 0.0663, "step": 58980 }, { "epoch": 1.48, "learning_rate": 0.0007769263623344974, "loss": 0.0721, "step": 58990 }, { "epoch": 1.48, "learning_rate": 0.0007765495063186192, "loss": 0.0709, "step": 59000 }, { "epoch": 1.48, "eval_cer": 0.6655189323231346, "eval_loss": 0.05791353061795235, "eval_runtime": 90.8528, "eval_samples_per_second": 110.057, "eval_steps_per_second": 6.879, "step": 59000 }, { "epoch": 1.48, "learning_rate": 0.000776172650302741, "loss": 0.067, "step": 59010 }, { "epoch": 1.48, "learning_rate": 0.0007757957942868628, "loss": 0.0698, "step": 59020 }, { "epoch": 1.48, "learning_rate": 0.0007754189382709846, "loss": 0.0648, "step": 59030 }, { "epoch": 1.48, "learning_rate": 0.0007750420822551064, "loss": 0.072, "step": 59040 }, { "epoch": 1.48, "learning_rate": 0.0007746652262392282, "loss": 0.0671, "step": 59050 }, { "epoch": 1.48, "learning_rate": 0.00077428837022335, "loss": 0.0685, "step": 59060 }, { "epoch": 1.48, "learning_rate": 0.0007739115142074718, "loss": 0.0673, "step": 59070 }, { "epoch": 1.48, "learning_rate": 0.0007735346581915936, "loss": 0.0664, "step": 59080 }, { "epoch": 1.48, "learning_rate": 0.0007731578021757155, "loss": 0.0675, "step": 59090 }, { "epoch": 1.48, "learning_rate": 0.0007727809461598371, "loss": 0.0644, "step": 59100 }, { "epoch": 1.49, "learning_rate": 0.0007724040901439591, "loss": 0.0687, "step": 59110 }, { "epoch": 1.49, "learning_rate": 0.0007720272341280807, "loss": 0.0703, "step": 59120 }, { "epoch": 1.49, "learning_rate": 0.0007716503781122027, "loss": 0.0687, "step": 59130 }, { "epoch": 1.49, "learning_rate": 0.0007712735220963245, "loss": 0.0705, "step": 59140 }, { "epoch": 1.49, "learning_rate": 0.0007708966660804463, "loss": 0.07, "step": 59150 }, { "epoch": 1.49, "learning_rate": 0.000770519810064568, "loss": 0.0704, "step": 59160 }, { "epoch": 1.49, "learning_rate": 0.0007701429540486899, "loss": 0.0653, "step": 59170 }, { "epoch": 1.49, "learning_rate": 0.0007697660980328116, "loss": 0.0672, "step": 59180 }, { "epoch": 1.49, "learning_rate": 0.0007693892420169333, "loss": 0.0728, "step": 59190 }, { "epoch": 1.49, "learning_rate": 0.0007690123860010552, "loss": 0.065, "step": 59200 }, { "epoch": 1.49, "learning_rate": 0.000768635529985177, "loss": 0.0676, "step": 59210 }, { "epoch": 1.49, "learning_rate": 0.0007682586739692988, "loss": 0.0692, "step": 59220 }, { "epoch": 1.49, "learning_rate": 0.0007678818179534206, "loss": 0.068, "step": 59230 }, { "epoch": 1.49, "learning_rate": 0.0007675049619375424, "loss": 0.0699, "step": 59240 }, { "epoch": 1.49, "learning_rate": 0.0007671281059216642, "loss": 0.0665, "step": 59250 }, { "epoch": 1.49, "learning_rate": 0.000766751249905786, "loss": 0.067, "step": 59260 }, { "epoch": 1.49, "learning_rate": 0.0007663743938899078, "loss": 0.0695, "step": 59270 }, { "epoch": 1.49, "learning_rate": 0.0007659975378740296, "loss": 0.0686, "step": 59280 }, { "epoch": 1.49, "learning_rate": 0.0007656206818581514, "loss": 0.0672, "step": 59290 }, { "epoch": 1.49, "learning_rate": 0.0007652438258422732, "loss": 0.0696, "step": 59300 }, { "epoch": 1.49, "learning_rate": 0.000764866969826395, "loss": 0.0683, "step": 59310 }, { "epoch": 1.49, "learning_rate": 0.0007644901138105168, "loss": 0.0688, "step": 59320 }, { "epoch": 1.49, "learning_rate": 0.0007641132577946386, "loss": 0.0678, "step": 59330 }, { "epoch": 1.49, "learning_rate": 0.0007637364017787604, "loss": 0.0669, "step": 59340 }, { "epoch": 1.49, "learning_rate": 0.0007633595457628822, "loss": 0.0649, "step": 59350 }, { "epoch": 1.49, "learning_rate": 0.000762982689747004, "loss": 0.0686, "step": 59360 }, { "epoch": 1.49, "learning_rate": 0.0007626058337311258, "loss": 0.0664, "step": 59370 }, { "epoch": 1.49, "learning_rate": 0.0007622289777152477, "loss": 0.0705, "step": 59380 }, { "epoch": 1.49, "learning_rate": 0.0007618521216993694, "loss": 0.0707, "step": 59390 }, { "epoch": 1.49, "learning_rate": 0.0007614752656834913, "loss": 0.0661, "step": 59400 }, { "epoch": 1.49, "learning_rate": 0.000761098409667613, "loss": 0.0675, "step": 59410 }, { "epoch": 1.49, "learning_rate": 0.0007607215536517347, "loss": 0.0721, "step": 59420 }, { "epoch": 1.49, "learning_rate": 0.0007603446976358567, "loss": 0.0701, "step": 59430 }, { "epoch": 1.49, "learning_rate": 0.0007599678416199783, "loss": 0.0692, "step": 59440 }, { "epoch": 1.49, "learning_rate": 0.0007595909856041003, "loss": 0.0692, "step": 59450 }, { "epoch": 1.49, "learning_rate": 0.0007592141295882219, "loss": 0.0671, "step": 59460 }, { "epoch": 1.49, "learning_rate": 0.0007588372735723439, "loss": 0.0707, "step": 59470 }, { "epoch": 1.49, "learning_rate": 0.0007584604175564655, "loss": 0.0657, "step": 59480 }, { "epoch": 1.49, "learning_rate": 0.0007580835615405875, "loss": 0.0668, "step": 59490 }, { "epoch": 1.49, "learning_rate": 0.0007577067055247092, "loss": 0.0661, "step": 59500 }, { "epoch": 1.49, "eval_cer": 0.6654530037675522, "eval_loss": 0.05784814804792404, "eval_runtime": 90.4465, "eval_samples_per_second": 110.552, "eval_steps_per_second": 6.91, "step": 59500 }, { "epoch": 1.5, "learning_rate": 0.0007573298495088311, "loss": 0.0689, "step": 59510 }, { "epoch": 1.5, "learning_rate": 0.0007569529934929528, "loss": 0.0678, "step": 59520 }, { "epoch": 1.5, "learning_rate": 0.0007565761374770747, "loss": 0.0683, "step": 59530 }, { "epoch": 1.5, "learning_rate": 0.0007561992814611964, "loss": 0.0712, "step": 59540 }, { "epoch": 1.5, "learning_rate": 0.0007558224254453183, "loss": 0.0658, "step": 59550 }, { "epoch": 1.5, "learning_rate": 0.00075544556942944, "loss": 0.0672, "step": 59560 }, { "epoch": 1.5, "learning_rate": 0.0007550687134135619, "loss": 0.0662, "step": 59570 }, { "epoch": 1.5, "learning_rate": 0.0007546918573976836, "loss": 0.0709, "step": 59580 }, { "epoch": 1.5, "learning_rate": 0.0007543150013818055, "loss": 0.0666, "step": 59590 }, { "epoch": 1.5, "learning_rate": 0.0007539381453659272, "loss": 0.0676, "step": 59600 }, { "epoch": 1.5, "learning_rate": 0.000753561289350049, "loss": 0.0709, "step": 59610 }, { "epoch": 1.5, "learning_rate": 0.0007531844333341708, "loss": 0.0698, "step": 59620 }, { "epoch": 1.5, "learning_rate": 0.0007528075773182925, "loss": 0.0671, "step": 59630 }, { "epoch": 1.5, "learning_rate": 0.0007524307213024144, "loss": 0.0737, "step": 59640 }, { "epoch": 1.5, "learning_rate": 0.0007520538652865361, "loss": 0.0681, "step": 59650 }, { "epoch": 1.5, "learning_rate": 0.000751677009270658, "loss": 0.0679, "step": 59660 }, { "epoch": 1.5, "learning_rate": 0.0007513001532547797, "loss": 0.0661, "step": 59670 }, { "epoch": 1.5, "learning_rate": 0.0007509232972389016, "loss": 0.0725, "step": 59680 }, { "epoch": 1.5, "learning_rate": 0.0007505464412230233, "loss": 0.0681, "step": 59690 }, { "epoch": 1.5, "learning_rate": 0.0007501695852071452, "loss": 0.0677, "step": 59700 }, { "epoch": 1.5, "learning_rate": 0.000749792729191267, "loss": 0.0694, "step": 59710 }, { "epoch": 1.5, "learning_rate": 0.0007494158731753889, "loss": 0.0684, "step": 59720 }, { "epoch": 1.5, "learning_rate": 0.0007490390171595106, "loss": 0.0678, "step": 59730 }, { "epoch": 1.5, "learning_rate": 0.0007486621611436324, "loss": 0.0685, "step": 59740 }, { "epoch": 1.5, "learning_rate": 0.0007482853051277541, "loss": 0.0681, "step": 59750 }, { "epoch": 1.5, "learning_rate": 0.000747908449111876, "loss": 0.0665, "step": 59760 }, { "epoch": 1.5, "learning_rate": 0.0007475315930959977, "loss": 0.0667, "step": 59770 }, { "epoch": 1.5, "learning_rate": 0.0007471547370801196, "loss": 0.0655, "step": 59780 }, { "epoch": 1.5, "learning_rate": 0.0007467778810642414, "loss": 0.0664, "step": 59790 }, { "epoch": 1.5, "learning_rate": 0.0007464010250483632, "loss": 0.0687, "step": 59800 }, { "epoch": 1.5, "learning_rate": 0.000746024169032485, "loss": 0.0664, "step": 59810 }, { "epoch": 1.5, "learning_rate": 0.0007456473130166068, "loss": 0.068, "step": 59820 }, { "epoch": 1.5, "learning_rate": 0.0007452704570007286, "loss": 0.0693, "step": 59830 }, { "epoch": 1.5, "learning_rate": 0.0007448936009848504, "loss": 0.0672, "step": 59840 }, { "epoch": 1.5, "learning_rate": 0.0007445167449689722, "loss": 0.0705, "step": 59850 }, { "epoch": 1.5, "learning_rate": 0.000744139888953094, "loss": 0.0661, "step": 59860 }, { "epoch": 1.5, "learning_rate": 0.0007437630329372158, "loss": 0.0674, "step": 59870 }, { "epoch": 1.5, "learning_rate": 0.0007433861769213376, "loss": 0.0716, "step": 59880 }, { "epoch": 1.5, "learning_rate": 0.0007430093209054594, "loss": 0.0687, "step": 59890 }, { "epoch": 1.5, "learning_rate": 0.0007426324648895813, "loss": 0.0663, "step": 59900 }, { "epoch": 1.51, "learning_rate": 0.000742255608873703, "loss": 0.0694, "step": 59910 }, { "epoch": 1.51, "learning_rate": 0.0007418787528578249, "loss": 0.0667, "step": 59920 }, { "epoch": 1.51, "learning_rate": 0.0007415018968419466, "loss": 0.0679, "step": 59930 }, { "epoch": 1.51, "learning_rate": 0.0007411250408260685, "loss": 0.0711, "step": 59940 }, { "epoch": 1.51, "learning_rate": 0.0007407481848101902, "loss": 0.0689, "step": 59950 }, { "epoch": 1.51, "learning_rate": 0.0007403713287943121, "loss": 0.0662, "step": 59960 }, { "epoch": 1.51, "learning_rate": 0.0007399944727784338, "loss": 0.0675, "step": 59970 }, { "epoch": 1.51, "learning_rate": 0.0007396176167625556, "loss": 0.0701, "step": 59980 }, { "epoch": 1.51, "learning_rate": 0.0007392407607466774, "loss": 0.0718, "step": 59990 }, { "epoch": 1.51, "learning_rate": 0.0007388639047307992, "loss": 0.0682, "step": 60000 }, { "epoch": 1.51, "eval_cer": 0.6654611846832085, "eval_loss": 0.05754994973540306, "eval_runtime": 90.0145, "eval_samples_per_second": 111.082, "eval_steps_per_second": 6.943, "step": 60000 }, { "epoch": 1.51, "learning_rate": 0.000738487048714921, "loss": 0.0691, "step": 60010 }, { "epoch": 1.51, "learning_rate": 0.0007381101926990427, "loss": 0.0659, "step": 60020 }, { "epoch": 1.51, "learning_rate": 0.0007377333366831646, "loss": 0.0685, "step": 60030 }, { "epoch": 1.51, "learning_rate": 0.0007373564806672863, "loss": 0.066, "step": 60040 }, { "epoch": 1.51, "learning_rate": 0.0007369796246514082, "loss": 0.07, "step": 60050 }, { "epoch": 1.51, "learning_rate": 0.0007366027686355299, "loss": 0.0656, "step": 60060 }, { "epoch": 1.51, "learning_rate": 0.0007362259126196518, "loss": 0.0708, "step": 60070 }, { "epoch": 1.51, "learning_rate": 0.0007358490566037737, "loss": 0.0699, "step": 60080 }, { "epoch": 1.51, "learning_rate": 0.0007354722005878954, "loss": 0.0696, "step": 60090 }, { "epoch": 1.51, "learning_rate": 0.0007350953445720172, "loss": 0.0668, "step": 60100 }, { "epoch": 1.51, "learning_rate": 0.000734718488556139, "loss": 0.0668, "step": 60110 }, { "epoch": 1.51, "learning_rate": 0.0007343416325402608, "loss": 0.0692, "step": 60120 }, { "epoch": 1.51, "learning_rate": 0.0007339647765243826, "loss": 0.0663, "step": 60130 }, { "epoch": 1.51, "learning_rate": 0.0007335879205085044, "loss": 0.0665, "step": 60140 }, { "epoch": 1.51, "learning_rate": 0.0007332110644926262, "loss": 0.0671, "step": 60150 }, { "epoch": 1.51, "learning_rate": 0.000732834208476748, "loss": 0.0675, "step": 60160 }, { "epoch": 1.51, "learning_rate": 0.0007324573524608698, "loss": 0.0667, "step": 60170 }, { "epoch": 1.51, "learning_rate": 0.0007320804964449916, "loss": 0.0687, "step": 60180 }, { "epoch": 1.51, "learning_rate": 0.0007317036404291134, "loss": 0.0699, "step": 60190 }, { "epoch": 1.51, "learning_rate": 0.0007313267844132351, "loss": 0.0704, "step": 60200 }, { "epoch": 1.51, "learning_rate": 0.000730949928397357, "loss": 0.0676, "step": 60210 }, { "epoch": 1.51, "learning_rate": 0.0007305730723814787, "loss": 0.0685, "step": 60220 }, { "epoch": 1.51, "learning_rate": 0.0007301962163656006, "loss": 0.0681, "step": 60230 }, { "epoch": 1.51, "learning_rate": 0.0007298193603497223, "loss": 0.0703, "step": 60240 }, { "epoch": 1.51, "learning_rate": 0.0007294425043338442, "loss": 0.068, "step": 60250 }, { "epoch": 1.51, "learning_rate": 0.000729065648317966, "loss": 0.067, "step": 60260 }, { "epoch": 1.51, "learning_rate": 0.0007286887923020878, "loss": 0.0683, "step": 60270 }, { "epoch": 1.51, "learning_rate": 0.0007283119362862096, "loss": 0.0679, "step": 60280 }, { "epoch": 1.51, "learning_rate": 0.0007279350802703314, "loss": 0.0664, "step": 60290 }, { "epoch": 1.51, "learning_rate": 0.0007275582242544532, "loss": 0.0672, "step": 60300 }, { "epoch": 1.52, "learning_rate": 0.000727181368238575, "loss": 0.0662, "step": 60310 }, { "epoch": 1.52, "learning_rate": 0.0007268045122226968, "loss": 0.0686, "step": 60320 }, { "epoch": 1.52, "learning_rate": 0.0007264276562068186, "loss": 0.0696, "step": 60330 }, { "epoch": 1.52, "learning_rate": 0.0007260508001909404, "loss": 0.0707, "step": 60340 }, { "epoch": 1.52, "learning_rate": 0.0007256739441750622, "loss": 0.0688, "step": 60350 }, { "epoch": 1.52, "learning_rate": 0.000725297088159184, "loss": 0.0695, "step": 60360 }, { "epoch": 1.52, "learning_rate": 0.0007249202321433059, "loss": 0.065, "step": 60370 }, { "epoch": 1.52, "learning_rate": 0.0007245433761274276, "loss": 0.0668, "step": 60380 }, { "epoch": 1.52, "learning_rate": 0.0007241665201115495, "loss": 0.0684, "step": 60390 }, { "epoch": 1.52, "learning_rate": 0.0007237896640956712, "loss": 0.0677, "step": 60400 }, { "epoch": 1.52, "learning_rate": 0.000723412808079793, "loss": 0.0666, "step": 60410 }, { "epoch": 1.52, "learning_rate": 0.0007230359520639148, "loss": 0.0679, "step": 60420 }, { "epoch": 1.52, "learning_rate": 0.0007226590960480366, "loss": 0.0676, "step": 60430 }, { "epoch": 1.52, "learning_rate": 0.0007222822400321584, "loss": 0.0691, "step": 60440 }, { "epoch": 1.52, "learning_rate": 0.0007219053840162802, "loss": 0.0655, "step": 60450 }, { "epoch": 1.52, "learning_rate": 0.000721528528000402, "loss": 0.0656, "step": 60460 }, { "epoch": 1.52, "learning_rate": 0.0007211516719845238, "loss": 0.068, "step": 60470 }, { "epoch": 1.52, "learning_rate": 0.0007207748159686456, "loss": 0.069, "step": 60480 }, { "epoch": 1.52, "learning_rate": 0.0007203979599527673, "loss": 0.0673, "step": 60490 }, { "epoch": 1.52, "learning_rate": 0.0007200211039368892, "loss": 0.0668, "step": 60500 }, { "epoch": 1.52, "eval_cer": 0.6654361607059072, "eval_loss": 0.057778164744377136, "eval_runtime": 90.8472, "eval_samples_per_second": 110.064, "eval_steps_per_second": 6.88, "step": 60500 }, { "epoch": 1.52, "learning_rate": 0.000719644247921011, "loss": 0.0698, "step": 60510 }, { "epoch": 1.52, "learning_rate": 0.0007192673919051328, "loss": 0.0697, "step": 60520 }, { "epoch": 1.52, "learning_rate": 0.0007188905358892545, "loss": 0.0695, "step": 60530 }, { "epoch": 1.52, "learning_rate": 0.0007185136798733764, "loss": 0.0689, "step": 60540 }, { "epoch": 1.52, "learning_rate": 0.0007181368238574983, "loss": 0.0695, "step": 60550 }, { "epoch": 1.52, "learning_rate": 0.00071775996784162, "loss": 0.0681, "step": 60560 }, { "epoch": 1.52, "learning_rate": 0.0007173831118257418, "loss": 0.068, "step": 60570 }, { "epoch": 1.52, "learning_rate": 0.0007170062558098636, "loss": 0.0631, "step": 60580 }, { "epoch": 1.52, "learning_rate": 0.0007166293997939854, "loss": 0.0691, "step": 60590 }, { "epoch": 1.52, "learning_rate": 0.0007162525437781072, "loss": 0.0687, "step": 60600 }, { "epoch": 1.52, "learning_rate": 0.000715875687762229, "loss": 0.067, "step": 60610 }, { "epoch": 1.52, "learning_rate": 0.0007154988317463508, "loss": 0.0693, "step": 60620 }, { "epoch": 1.52, "learning_rate": 0.0007151219757304725, "loss": 0.0688, "step": 60630 }, { "epoch": 1.52, "learning_rate": 0.0007147451197145944, "loss": 0.0675, "step": 60640 }, { "epoch": 1.52, "learning_rate": 0.0007143682636987161, "loss": 0.0664, "step": 60650 }, { "epoch": 1.52, "learning_rate": 0.000713991407682838, "loss": 0.0664, "step": 60660 }, { "epoch": 1.52, "learning_rate": 0.0007136145516669597, "loss": 0.0685, "step": 60670 }, { "epoch": 1.52, "learning_rate": 0.0007132376956510816, "loss": 0.0655, "step": 60680 }, { "epoch": 1.52, "learning_rate": 0.0007128608396352033, "loss": 0.0665, "step": 60690 }, { "epoch": 1.52, "learning_rate": 0.0007124839836193252, "loss": 0.0638, "step": 60700 }, { "epoch": 1.53, "learning_rate": 0.000712107127603447, "loss": 0.0678, "step": 60710 }, { "epoch": 1.53, "learning_rate": 0.0007117302715875688, "loss": 0.0653, "step": 60720 }, { "epoch": 1.53, "learning_rate": 0.0007113534155716906, "loss": 0.067, "step": 60730 }, { "epoch": 1.53, "learning_rate": 0.0007109765595558124, "loss": 0.0661, "step": 60740 }, { "epoch": 1.53, "learning_rate": 0.0007105997035399342, "loss": 0.0675, "step": 60750 }, { "epoch": 1.53, "learning_rate": 0.000710222847524056, "loss": 0.0693, "step": 60760 }, { "epoch": 1.53, "learning_rate": 0.0007098459915081778, "loss": 0.0674, "step": 60770 }, { "epoch": 1.53, "learning_rate": 0.0007094691354922996, "loss": 0.0656, "step": 60780 }, { "epoch": 1.53, "learning_rate": 0.0007090922794764214, "loss": 0.0652, "step": 60790 }, { "epoch": 1.53, "learning_rate": 0.0007087154234605432, "loss": 0.0667, "step": 60800 }, { "epoch": 1.53, "learning_rate": 0.000708338567444665, "loss": 0.0663, "step": 60810 }, { "epoch": 1.53, "learning_rate": 0.0007079617114287869, "loss": 0.0697, "step": 60820 }, { "epoch": 1.53, "learning_rate": 0.0007075848554129086, "loss": 0.0671, "step": 60830 }, { "epoch": 1.53, "learning_rate": 0.0007072079993970305, "loss": 0.0667, "step": 60840 }, { "epoch": 1.53, "learning_rate": 0.0007068311433811522, "loss": 0.068, "step": 60850 }, { "epoch": 1.53, "learning_rate": 0.000706454287365274, "loss": 0.0701, "step": 60860 }, { "epoch": 1.53, "learning_rate": 0.0007060774313493957, "loss": 0.0699, "step": 60870 }, { "epoch": 1.53, "learning_rate": 0.0007057005753335176, "loss": 0.067, "step": 60880 }, { "epoch": 1.53, "learning_rate": 0.0007053237193176394, "loss": 0.0658, "step": 60890 }, { "epoch": 1.53, "learning_rate": 0.0007049468633017612, "loss": 0.0675, "step": 60900 }, { "epoch": 1.53, "learning_rate": 0.000704570007285883, "loss": 0.0681, "step": 60910 }, { "epoch": 1.53, "learning_rate": 0.0007041931512700048, "loss": 0.0667, "step": 60920 }, { "epoch": 1.53, "learning_rate": 0.0007038162952541266, "loss": 0.0652, "step": 60930 }, { "epoch": 1.53, "learning_rate": 0.0007034394392382484, "loss": 0.068, "step": 60940 }, { "epoch": 1.53, "learning_rate": 0.0007030625832223702, "loss": 0.0657, "step": 60950 }, { "epoch": 1.53, "learning_rate": 0.000702685727206492, "loss": 0.0681, "step": 60960 }, { "epoch": 1.53, "learning_rate": 0.0007023088711906138, "loss": 0.0685, "step": 60970 }, { "epoch": 1.53, "learning_rate": 0.0007019320151747355, "loss": 0.0691, "step": 60980 }, { "epoch": 1.53, "learning_rate": 0.0007015551591588574, "loss": 0.0701, "step": 60990 }, { "epoch": 1.53, "learning_rate": 0.0007011783031429793, "loss": 0.0684, "step": 61000 }, { "epoch": 1.53, "eval_cer": 0.6652614740951306, "eval_loss": 0.05754827708005905, "eval_runtime": 90.703, "eval_samples_per_second": 110.239, "eval_steps_per_second": 6.891, "step": 61000 }, { "epoch": 1.53, "learning_rate": 0.000700801447127101, "loss": 0.0681, "step": 61010 }, { "epoch": 1.53, "learning_rate": 0.0007004245911112229, "loss": 0.0694, "step": 61020 }, { "epoch": 1.53, "learning_rate": 0.0007000477350953446, "loss": 0.0651, "step": 61030 }, { "epoch": 1.53, "learning_rate": 0.0006996708790794664, "loss": 0.0684, "step": 61040 }, { "epoch": 1.53, "learning_rate": 0.0006992940230635882, "loss": 0.0679, "step": 61050 }, { "epoch": 1.53, "learning_rate": 0.00069891716704771, "loss": 0.0683, "step": 61060 }, { "epoch": 1.53, "learning_rate": 0.0006985403110318318, "loss": 0.0679, "step": 61070 }, { "epoch": 1.53, "learning_rate": 0.0006981634550159535, "loss": 0.0656, "step": 61080 }, { "epoch": 1.53, "learning_rate": 0.0006977865990000754, "loss": 0.065, "step": 61090 }, { "epoch": 1.54, "learning_rate": 0.0006974097429841971, "loss": 0.0667, "step": 61100 }, { "epoch": 1.54, "learning_rate": 0.000697032886968319, "loss": 0.067, "step": 61110 }, { "epoch": 1.54, "learning_rate": 0.0006966560309524407, "loss": 0.068, "step": 61120 }, { "epoch": 1.54, "learning_rate": 0.0006962791749365626, "loss": 0.0671, "step": 61130 }, { "epoch": 1.54, "learning_rate": 0.0006959023189206843, "loss": 0.0662, "step": 61140 }, { "epoch": 1.54, "learning_rate": 0.0006955254629048062, "loss": 0.0676, "step": 61150 }, { "epoch": 1.54, "learning_rate": 0.0006951486068889279, "loss": 0.0679, "step": 61160 }, { "epoch": 1.54, "learning_rate": 0.0006947717508730498, "loss": 0.0686, "step": 61170 }, { "epoch": 1.54, "learning_rate": 0.0006943948948571716, "loss": 0.0684, "step": 61180 }, { "epoch": 1.54, "learning_rate": 0.0006940180388412934, "loss": 0.0653, "step": 61190 }, { "epoch": 1.54, "learning_rate": 0.0006936411828254152, "loss": 0.0682, "step": 61200 }, { "epoch": 1.54, "learning_rate": 0.000693264326809537, "loss": 0.0668, "step": 61210 }, { "epoch": 1.54, "learning_rate": 0.0006928874707936588, "loss": 0.0671, "step": 61220 }, { "epoch": 1.54, "learning_rate": 0.0006925106147777806, "loss": 0.065, "step": 61230 }, { "epoch": 1.54, "learning_rate": 0.0006921337587619024, "loss": 0.0694, "step": 61240 }, { "epoch": 1.54, "learning_rate": 0.0006917569027460242, "loss": 0.0658, "step": 61250 }, { "epoch": 1.54, "learning_rate": 0.000691380046730146, "loss": 0.0692, "step": 61260 }, { "epoch": 1.54, "learning_rate": 0.0006910031907142678, "loss": 0.066, "step": 61270 }, { "epoch": 1.54, "learning_rate": 0.0006906263346983896, "loss": 0.0656, "step": 61280 }, { "epoch": 1.54, "learning_rate": 0.0006902494786825115, "loss": 0.0684, "step": 61290 }, { "epoch": 1.54, "learning_rate": 0.0006898726226666331, "loss": 0.0674, "step": 61300 }, { "epoch": 1.54, "learning_rate": 0.000689495766650755, "loss": 0.0688, "step": 61310 }, { "epoch": 1.54, "learning_rate": 0.0006891189106348767, "loss": 0.0688, "step": 61320 }, { "epoch": 1.54, "learning_rate": 0.0006887420546189986, "loss": 0.0672, "step": 61330 }, { "epoch": 1.54, "learning_rate": 0.0006883651986031203, "loss": 0.065, "step": 61340 }, { "epoch": 1.54, "learning_rate": 0.0006879883425872422, "loss": 0.0691, "step": 61350 }, { "epoch": 1.54, "learning_rate": 0.000687611486571364, "loss": 0.0709, "step": 61360 }, { "epoch": 1.54, "learning_rate": 0.0006872346305554858, "loss": 0.0676, "step": 61370 }, { "epoch": 1.54, "learning_rate": 0.0006868577745396076, "loss": 0.0668, "step": 61380 }, { "epoch": 1.54, "learning_rate": 0.0006864809185237294, "loss": 0.069, "step": 61390 }, { "epoch": 1.54, "learning_rate": 0.0006861040625078512, "loss": 0.064, "step": 61400 }, { "epoch": 1.54, "learning_rate": 0.000685727206491973, "loss": 0.0661, "step": 61410 }, { "epoch": 1.54, "learning_rate": 0.0006853503504760948, "loss": 0.0712, "step": 61420 }, { "epoch": 1.54, "learning_rate": 0.0006849734944602165, "loss": 0.0652, "step": 61430 }, { "epoch": 1.54, "learning_rate": 0.0006845966384443384, "loss": 0.0686, "step": 61440 }, { "epoch": 1.54, "learning_rate": 0.0006842197824284601, "loss": 0.0654, "step": 61450 }, { "epoch": 1.54, "learning_rate": 0.000683842926412582, "loss": 0.0674, "step": 61460 }, { "epoch": 1.54, "learning_rate": 0.0006834660703967039, "loss": 0.0647, "step": 61470 }, { "epoch": 1.54, "learning_rate": 0.0006830892143808256, "loss": 0.0708, "step": 61480 }, { "epoch": 1.54, "learning_rate": 0.0006827123583649474, "loss": 0.0674, "step": 61490 }, { "epoch": 1.55, "learning_rate": 0.0006823355023490692, "loss": 0.0688, "step": 61500 }, { "epoch": 1.55, "eval_cer": 0.6651676341802506, "eval_loss": 0.057114891707897186, "eval_runtime": 90.5132, "eval_samples_per_second": 110.47, "eval_steps_per_second": 6.905, "step": 61500 }, { "epoch": 1.55, "learning_rate": 0.000681958646333191, "loss": 0.0684, "step": 61510 }, { "epoch": 1.55, "learning_rate": 0.0006815817903173128, "loss": 0.0659, "step": 61520 }, { "epoch": 1.55, "learning_rate": 0.0006812049343014345, "loss": 0.0671, "step": 61530 }, { "epoch": 1.55, "learning_rate": 0.0006808280782855564, "loss": 0.0678, "step": 61540 }, { "epoch": 1.55, "learning_rate": 0.0006804512222696781, "loss": 0.0649, "step": 61550 }, { "epoch": 1.55, "learning_rate": 0.0006800743662538, "loss": 0.065, "step": 61560 }, { "epoch": 1.55, "learning_rate": 0.0006796975102379217, "loss": 0.0647, "step": 61570 }, { "epoch": 1.55, "learning_rate": 0.0006793206542220436, "loss": 0.0667, "step": 61580 }, { "epoch": 1.55, "learning_rate": 0.0006789437982061653, "loss": 0.0674, "step": 61590 }, { "epoch": 1.55, "learning_rate": 0.0006785669421902872, "loss": 0.0648, "step": 61600 }, { "epoch": 1.55, "learning_rate": 0.0006781900861744089, "loss": 0.0641, "step": 61610 }, { "epoch": 1.55, "learning_rate": 0.0006778132301585308, "loss": 0.0651, "step": 61620 }, { "epoch": 1.55, "learning_rate": 0.0006774363741426525, "loss": 0.0684, "step": 61630 }, { "epoch": 1.55, "learning_rate": 0.0006770595181267744, "loss": 0.0655, "step": 61640 }, { "epoch": 1.55, "learning_rate": 0.0006766826621108962, "loss": 0.0677, "step": 61650 }, { "epoch": 1.55, "learning_rate": 0.000676305806095018, "loss": 0.068, "step": 61660 }, { "epoch": 1.55, "learning_rate": 0.0006759289500791398, "loss": 0.0647, "step": 61670 }, { "epoch": 1.55, "learning_rate": 0.0006755520940632616, "loss": 0.0642, "step": 61680 }, { "epoch": 1.55, "learning_rate": 0.0006751752380473834, "loss": 0.0663, "step": 61690 }, { "epoch": 1.55, "learning_rate": 0.0006747983820315052, "loss": 0.0642, "step": 61700 }, { "epoch": 1.55, "learning_rate": 0.000674421526015627, "loss": 0.0679, "step": 61710 }, { "epoch": 1.55, "learning_rate": 0.0006740446699997488, "loss": 0.0702, "step": 61720 }, { "epoch": 1.55, "learning_rate": 0.0006736678139838706, "loss": 0.0678, "step": 61730 }, { "epoch": 1.55, "learning_rate": 0.0006732909579679924, "loss": 0.0685, "step": 61740 }, { "epoch": 1.55, "learning_rate": 0.0006729141019521141, "loss": 0.0663, "step": 61750 }, { "epoch": 1.55, "learning_rate": 0.000672537245936236, "loss": 0.0666, "step": 61760 }, { "epoch": 1.55, "learning_rate": 0.0006721603899203577, "loss": 0.0691, "step": 61770 }, { "epoch": 1.55, "learning_rate": 0.0006717835339044796, "loss": 0.066, "step": 61780 }, { "epoch": 1.55, "learning_rate": 0.0006714066778886013, "loss": 0.0692, "step": 61790 }, { "epoch": 1.55, "learning_rate": 0.0006710298218727232, "loss": 0.0679, "step": 61800 }, { "epoch": 1.55, "learning_rate": 0.000670652965856845, "loss": 0.066, "step": 61810 }, { "epoch": 1.55, "learning_rate": 0.0006702761098409668, "loss": 0.0687, "step": 61820 }, { "epoch": 1.55, "learning_rate": 0.0006698992538250886, "loss": 0.069, "step": 61830 }, { "epoch": 1.55, "learning_rate": 0.0006695223978092104, "loss": 0.0663, "step": 61840 }, { "epoch": 1.55, "learning_rate": 0.0006691455417933322, "loss": 0.067, "step": 61850 }, { "epoch": 1.55, "learning_rate": 0.000668768685777454, "loss": 0.0697, "step": 61860 }, { "epoch": 1.55, "learning_rate": 0.0006683918297615758, "loss": 0.0657, "step": 61870 }, { "epoch": 1.55, "learning_rate": 0.0006680149737456976, "loss": 0.0666, "step": 61880 }, { "epoch": 1.55, "learning_rate": 0.0006676381177298194, "loss": 0.0674, "step": 61890 }, { "epoch": 1.56, "learning_rate": 0.0006672612617139411, "loss": 0.0653, "step": 61900 }, { "epoch": 1.56, "learning_rate": 0.000666884405698063, "loss": 0.0667, "step": 61910 }, { "epoch": 1.56, "learning_rate": 0.0006665075496821847, "loss": 0.0651, "step": 61920 }, { "epoch": 1.56, "learning_rate": 0.0006661306936663066, "loss": 0.0667, "step": 61930 }, { "epoch": 1.56, "learning_rate": 0.0006657538376504285, "loss": 0.065, "step": 61940 }, { "epoch": 1.56, "learning_rate": 0.0006653769816345502, "loss": 0.068, "step": 61950 }, { "epoch": 1.56, "learning_rate": 0.000665000125618672, "loss": 0.0639, "step": 61960 }, { "epoch": 1.56, "learning_rate": 0.0006646232696027937, "loss": 0.0669, "step": 61970 }, { "epoch": 1.56, "learning_rate": 0.0006642464135869155, "loss": 0.0688, "step": 61980 }, { "epoch": 1.56, "learning_rate": 0.0006638695575710374, "loss": 0.0689, "step": 61990 }, { "epoch": 1.56, "learning_rate": 0.0006634927015551591, "loss": 0.068, "step": 62000 }, { "epoch": 1.56, "eval_cer": 0.6652715799321176, "eval_loss": 0.057154275476932526, "eval_runtime": 90.7336, "eval_samples_per_second": 110.202, "eval_steps_per_second": 6.888, "step": 62000 }, { "epoch": 1.56, "learning_rate": 0.000663115845539281, "loss": 0.0659, "step": 62010 }, { "epoch": 1.56, "learning_rate": 0.0006627389895234027, "loss": 0.0678, "step": 62020 }, { "epoch": 1.56, "learning_rate": 0.0006623621335075246, "loss": 0.0661, "step": 62030 }, { "epoch": 1.56, "learning_rate": 0.0006619852774916463, "loss": 0.0668, "step": 62040 }, { "epoch": 1.56, "learning_rate": 0.0006616084214757682, "loss": 0.0666, "step": 62050 }, { "epoch": 1.56, "learning_rate": 0.0006612315654598899, "loss": 0.0656, "step": 62060 }, { "epoch": 1.56, "learning_rate": 0.0006608547094440118, "loss": 0.0658, "step": 62070 }, { "epoch": 1.56, "learning_rate": 0.0006604778534281335, "loss": 0.0661, "step": 62080 }, { "epoch": 1.56, "learning_rate": 0.0006601009974122554, "loss": 0.0676, "step": 62090 }, { "epoch": 1.56, "learning_rate": 0.0006597241413963772, "loss": 0.0702, "step": 62100 }, { "epoch": 1.56, "learning_rate": 0.000659347285380499, "loss": 0.0653, "step": 62110 }, { "epoch": 1.56, "learning_rate": 0.0006589704293646208, "loss": 0.0682, "step": 62120 }, { "epoch": 1.56, "learning_rate": 0.0006585935733487426, "loss": 0.0672, "step": 62130 }, { "epoch": 1.56, "learning_rate": 0.0006582167173328644, "loss": 0.0708, "step": 62140 }, { "epoch": 1.56, "learning_rate": 0.0006578398613169862, "loss": 0.0669, "step": 62150 }, { "epoch": 1.56, "learning_rate": 0.000657463005301108, "loss": 0.0646, "step": 62160 }, { "epoch": 1.56, "learning_rate": 0.0006570861492852298, "loss": 0.0681, "step": 62170 }, { "epoch": 1.56, "learning_rate": 0.0006567092932693516, "loss": 0.0662, "step": 62180 }, { "epoch": 1.56, "learning_rate": 0.0006563324372534734, "loss": 0.0659, "step": 62190 }, { "epoch": 1.56, "learning_rate": 0.0006559555812375951, "loss": 0.0683, "step": 62200 }, { "epoch": 1.56, "learning_rate": 0.000655578725221717, "loss": 0.0662, "step": 62210 }, { "epoch": 1.56, "learning_rate": 0.0006552018692058387, "loss": 0.0671, "step": 62220 }, { "epoch": 1.56, "learning_rate": 0.0006548250131899606, "loss": 0.0654, "step": 62230 }, { "epoch": 1.56, "learning_rate": 0.0006544481571740823, "loss": 0.0672, "step": 62240 }, { "epoch": 1.56, "learning_rate": 0.0006540713011582042, "loss": 0.0675, "step": 62250 }, { "epoch": 1.56, "learning_rate": 0.0006536944451423259, "loss": 0.0648, "step": 62260 }, { "epoch": 1.56, "learning_rate": 0.0006533175891264478, "loss": 0.0667, "step": 62270 }, { "epoch": 1.56, "learning_rate": 0.0006529407331105696, "loss": 0.0675, "step": 62280 }, { "epoch": 1.56, "learning_rate": 0.0006525638770946914, "loss": 0.069, "step": 62290 }, { "epoch": 1.57, "learning_rate": 0.0006521870210788132, "loss": 0.0685, "step": 62300 }, { "epoch": 1.57, "learning_rate": 0.000651810165062935, "loss": 0.0672, "step": 62310 }, { "epoch": 1.57, "learning_rate": 0.0006514333090470568, "loss": 0.0685, "step": 62320 }, { "epoch": 1.57, "learning_rate": 0.0006510564530311786, "loss": 0.0649, "step": 62330 }, { "epoch": 1.57, "learning_rate": 0.0006506795970153004, "loss": 0.0662, "step": 62340 }, { "epoch": 1.57, "learning_rate": 0.0006503027409994221, "loss": 0.0644, "step": 62350 }, { "epoch": 1.57, "learning_rate": 0.000649925884983544, "loss": 0.0676, "step": 62360 }, { "epoch": 1.57, "learning_rate": 0.0006495490289676657, "loss": 0.0633, "step": 62370 }, { "epoch": 1.57, "learning_rate": 0.0006491721729517876, "loss": 0.0665, "step": 62380 }, { "epoch": 1.57, "learning_rate": 0.0006487953169359095, "loss": 0.0652, "step": 62390 }, { "epoch": 1.57, "learning_rate": 0.0006484184609200312, "loss": 0.0693, "step": 62400 }, { "epoch": 1.57, "learning_rate": 0.0006480416049041529, "loss": 0.0653, "step": 62410 }, { "epoch": 1.57, "learning_rate": 0.0006476647488882747, "loss": 0.0638, "step": 62420 }, { "epoch": 1.57, "learning_rate": 0.0006472878928723965, "loss": 0.0688, "step": 62430 }, { "epoch": 1.57, "learning_rate": 0.0006469110368565183, "loss": 0.0649, "step": 62440 }, { "epoch": 1.57, "learning_rate": 0.0006465341808406401, "loss": 0.0673, "step": 62450 }, { "epoch": 1.57, "learning_rate": 0.000646157324824762, "loss": 0.0677, "step": 62460 }, { "epoch": 1.57, "learning_rate": 0.0006457804688088837, "loss": 0.0645, "step": 62470 }, { "epoch": 1.57, "learning_rate": 0.0006454036127930056, "loss": 0.0678, "step": 62480 }, { "epoch": 1.57, "learning_rate": 0.0006450267567771273, "loss": 0.0665, "step": 62490 }, { "epoch": 1.57, "learning_rate": 0.0006446499007612492, "loss": 0.0694, "step": 62500 }, { "epoch": 1.57, "eval_cer": 0.6654116179589386, "eval_loss": 0.056619539856910706, "eval_runtime": 90.723, "eval_samples_per_second": 110.215, "eval_steps_per_second": 6.889, "step": 62500 }, { "epoch": 1.57, "learning_rate": 0.0006442730447453709, "loss": 0.0661, "step": 62510 }, { "epoch": 1.57, "learning_rate": 0.0006438961887294928, "loss": 0.0666, "step": 62520 }, { "epoch": 1.57, "learning_rate": 0.0006435193327136145, "loss": 0.0644, "step": 62530 }, { "epoch": 1.57, "learning_rate": 0.0006431424766977364, "loss": 0.0678, "step": 62540 }, { "epoch": 1.57, "learning_rate": 0.0006427656206818581, "loss": 0.0662, "step": 62550 }, { "epoch": 1.57, "learning_rate": 0.00064238876466598, "loss": 0.0655, "step": 62560 }, { "epoch": 1.57, "learning_rate": 0.0006420119086501018, "loss": 0.0678, "step": 62570 }, { "epoch": 1.57, "learning_rate": 0.0006416350526342236, "loss": 0.0658, "step": 62580 }, { "epoch": 1.57, "learning_rate": 0.0006412581966183454, "loss": 0.0639, "step": 62590 }, { "epoch": 1.57, "learning_rate": 0.0006408813406024672, "loss": 0.0676, "step": 62600 }, { "epoch": 1.57, "learning_rate": 0.000640504484586589, "loss": 0.0629, "step": 62610 }, { "epoch": 1.57, "learning_rate": 0.0006401276285707108, "loss": 0.0663, "step": 62620 }, { "epoch": 1.57, "learning_rate": 0.0006397507725548326, "loss": 0.0672, "step": 62630 }, { "epoch": 1.57, "learning_rate": 0.0006393739165389544, "loss": 0.0659, "step": 62640 }, { "epoch": 1.57, "learning_rate": 0.0006389970605230761, "loss": 0.0648, "step": 62650 }, { "epoch": 1.57, "learning_rate": 0.000638620204507198, "loss": 0.0633, "step": 62660 }, { "epoch": 1.57, "learning_rate": 0.0006382433484913197, "loss": 0.0688, "step": 62670 }, { "epoch": 1.57, "learning_rate": 0.0006378664924754416, "loss": 0.0658, "step": 62680 }, { "epoch": 1.57, "learning_rate": 0.0006374896364595633, "loss": 0.0654, "step": 62690 }, { "epoch": 1.58, "learning_rate": 0.0006371127804436852, "loss": 0.0673, "step": 62700 }, { "epoch": 1.58, "learning_rate": 0.0006367359244278069, "loss": 0.0643, "step": 62710 }, { "epoch": 1.58, "learning_rate": 0.0006363590684119288, "loss": 0.0677, "step": 62720 }, { "epoch": 1.58, "learning_rate": 0.0006359822123960505, "loss": 0.0652, "step": 62730 }, { "epoch": 1.58, "learning_rate": 0.0006356053563801724, "loss": 0.0651, "step": 62740 }, { "epoch": 1.58, "learning_rate": 0.0006352285003642942, "loss": 0.0663, "step": 62750 }, { "epoch": 1.58, "learning_rate": 0.000634851644348416, "loss": 0.067, "step": 62760 }, { "epoch": 1.58, "learning_rate": 0.0006344747883325378, "loss": 0.0712, "step": 62770 }, { "epoch": 1.58, "learning_rate": 0.0006340979323166596, "loss": 0.0674, "step": 62780 }, { "epoch": 1.58, "learning_rate": 0.0006337210763007814, "loss": 0.0645, "step": 62790 }, { "epoch": 1.58, "learning_rate": 0.0006333442202849032, "loss": 0.0656, "step": 62800 }, { "epoch": 1.58, "learning_rate": 0.000632967364269025, "loss": 0.0675, "step": 62810 }, { "epoch": 1.58, "learning_rate": 0.0006325905082531467, "loss": 0.0687, "step": 62820 }, { "epoch": 1.58, "learning_rate": 0.0006322136522372686, "loss": 0.0671, "step": 62830 }, { "epoch": 1.58, "learning_rate": 0.0006318367962213903, "loss": 0.0662, "step": 62840 }, { "epoch": 1.58, "learning_rate": 0.0006314599402055122, "loss": 0.0606, "step": 62850 }, { "epoch": 1.58, "learning_rate": 0.0006310830841896339, "loss": 0.0666, "step": 62860 }, { "epoch": 1.58, "learning_rate": 0.0006307062281737557, "loss": 0.0664, "step": 62870 }, { "epoch": 1.58, "learning_rate": 0.0006303293721578775, "loss": 0.0684, "step": 62880 }, { "epoch": 1.58, "learning_rate": 0.0006299525161419993, "loss": 0.066, "step": 62890 }, { "epoch": 1.58, "learning_rate": 0.0006295756601261211, "loss": 0.0689, "step": 62900 }, { "epoch": 1.58, "learning_rate": 0.000629198804110243, "loss": 0.0677, "step": 62910 }, { "epoch": 1.58, "learning_rate": 0.0006288219480943647, "loss": 0.0666, "step": 62920 }, { "epoch": 1.58, "learning_rate": 0.0006284450920784866, "loss": 0.0675, "step": 62930 }, { "epoch": 1.58, "learning_rate": 0.0006280682360626083, "loss": 0.0684, "step": 62940 }, { "epoch": 1.58, "learning_rate": 0.0006276913800467302, "loss": 0.0654, "step": 62950 }, { "epoch": 1.58, "learning_rate": 0.0006273145240308519, "loss": 0.0703, "step": 62960 }, { "epoch": 1.58, "learning_rate": 0.0006269376680149738, "loss": 0.0691, "step": 62970 }, { "epoch": 1.58, "learning_rate": 0.0006265608119990955, "loss": 0.064, "step": 62980 }, { "epoch": 1.58, "learning_rate": 0.0006261839559832174, "loss": 0.066, "step": 62990 }, { "epoch": 1.58, "learning_rate": 0.0006258070999673391, "loss": 0.0642, "step": 63000 }, { "epoch": 1.58, "eval_cer": 0.6652528119491417, "eval_loss": 0.056862492114305496, "eval_runtime": 90.801, "eval_samples_per_second": 110.12, "eval_steps_per_second": 6.883, "step": 63000 }, { "epoch": 1.58, "learning_rate": 0.000625430243951461, "loss": 0.0663, "step": 63010 }, { "epoch": 1.58, "learning_rate": 0.0006250533879355827, "loss": 0.0663, "step": 63020 }, { "epoch": 1.58, "learning_rate": 0.0006246765319197046, "loss": 0.0627, "step": 63030 }, { "epoch": 1.58, "learning_rate": 0.0006242996759038264, "loss": 0.0667, "step": 63040 }, { "epoch": 1.58, "learning_rate": 0.0006239228198879482, "loss": 0.0653, "step": 63050 }, { "epoch": 1.58, "learning_rate": 0.00062354596387207, "loss": 0.0663, "step": 63060 }, { "epoch": 1.58, "learning_rate": 0.0006231691078561918, "loss": 0.0646, "step": 63070 }, { "epoch": 1.58, "learning_rate": 0.0006227922518403135, "loss": 0.0679, "step": 63080 }, { "epoch": 1.59, "learning_rate": 0.0006224153958244354, "loss": 0.0661, "step": 63090 }, { "epoch": 1.59, "learning_rate": 0.0006220385398085571, "loss": 0.0638, "step": 63100 }, { "epoch": 1.59, "learning_rate": 0.000621661683792679, "loss": 0.0663, "step": 63110 }, { "epoch": 1.59, "learning_rate": 0.0006212848277768007, "loss": 0.0645, "step": 63120 }, { "epoch": 1.59, "learning_rate": 0.0006209079717609226, "loss": 0.0713, "step": 63130 }, { "epoch": 1.59, "learning_rate": 0.0006205311157450443, "loss": 0.0679, "step": 63140 }, { "epoch": 1.59, "learning_rate": 0.0006201542597291662, "loss": 0.0675, "step": 63150 }, { "epoch": 1.59, "learning_rate": 0.0006197774037132879, "loss": 0.0652, "step": 63160 }, { "epoch": 1.59, "learning_rate": 0.0006194005476974098, "loss": 0.0698, "step": 63170 }, { "epoch": 1.59, "learning_rate": 0.0006190236916815315, "loss": 0.066, "step": 63180 }, { "epoch": 1.59, "learning_rate": 0.0006186468356656534, "loss": 0.0676, "step": 63190 }, { "epoch": 1.59, "learning_rate": 0.0006182699796497752, "loss": 0.0651, "step": 63200 }, { "epoch": 1.59, "learning_rate": 0.000617893123633897, "loss": 0.0647, "step": 63210 }, { "epoch": 1.59, "learning_rate": 0.0006175162676180188, "loss": 0.0659, "step": 63220 }, { "epoch": 1.59, "learning_rate": 0.0006171394116021406, "loss": 0.0676, "step": 63230 }, { "epoch": 1.59, "learning_rate": 0.0006167625555862624, "loss": 0.069, "step": 63240 }, { "epoch": 1.59, "learning_rate": 0.0006163856995703842, "loss": 0.0658, "step": 63250 }, { "epoch": 1.59, "learning_rate": 0.000616008843554506, "loss": 0.0674, "step": 63260 }, { "epoch": 1.59, "learning_rate": 0.0006156319875386278, "loss": 0.0663, "step": 63270 }, { "epoch": 1.59, "learning_rate": 0.0006152551315227496, "loss": 0.0642, "step": 63280 }, { "epoch": 1.59, "learning_rate": 0.0006148782755068713, "loss": 0.0672, "step": 63290 }, { "epoch": 1.59, "learning_rate": 0.0006145014194909931, "loss": 0.0697, "step": 63300 }, { "epoch": 1.59, "learning_rate": 0.000614124563475115, "loss": 0.0687, "step": 63310 }, { "epoch": 1.59, "learning_rate": 0.0006137477074592367, "loss": 0.0691, "step": 63320 }, { "epoch": 1.59, "learning_rate": 0.0006133708514433585, "loss": 0.0636, "step": 63330 }, { "epoch": 1.59, "learning_rate": 0.0006129939954274803, "loss": 0.0646, "step": 63340 }, { "epoch": 1.59, "learning_rate": 0.0006126171394116021, "loss": 0.0679, "step": 63350 }, { "epoch": 1.59, "learning_rate": 0.0006122402833957239, "loss": 0.0681, "step": 63360 }, { "epoch": 1.59, "learning_rate": 0.0006118634273798457, "loss": 0.0677, "step": 63370 }, { "epoch": 1.59, "learning_rate": 0.0006114865713639676, "loss": 0.069, "step": 63380 }, { "epoch": 1.59, "learning_rate": 0.0006111097153480893, "loss": 0.0669, "step": 63390 }, { "epoch": 1.59, "learning_rate": 0.0006107328593322112, "loss": 0.0653, "step": 63400 }, { "epoch": 1.59, "learning_rate": 0.0006103560033163329, "loss": 0.0675, "step": 63410 }, { "epoch": 1.59, "learning_rate": 0.0006099791473004548, "loss": 0.0661, "step": 63420 }, { "epoch": 1.59, "learning_rate": 0.0006096022912845765, "loss": 0.0651, "step": 63430 }, { "epoch": 1.59, "learning_rate": 0.0006092254352686984, "loss": 0.0635, "step": 63440 }, { "epoch": 1.59, "learning_rate": 0.0006088485792528201, "loss": 0.0673, "step": 63450 }, { "epoch": 1.59, "learning_rate": 0.000608471723236942, "loss": 0.0665, "step": 63460 }, { "epoch": 1.59, "learning_rate": 0.0006080948672210637, "loss": 0.0647, "step": 63470 }, { "epoch": 1.59, "learning_rate": 0.0006077180112051856, "loss": 0.0682, "step": 63480 }, { "epoch": 1.6, "learning_rate": 0.0006073411551893074, "loss": 0.0642, "step": 63490 }, { "epoch": 1.6, "learning_rate": 0.0006069642991734292, "loss": 0.0646, "step": 63500 }, { "epoch": 1.6, "eval_cer": 0.6655126763288093, "eval_loss": 0.05644620954990387, "eval_runtime": 90.7214, "eval_samples_per_second": 110.217, "eval_steps_per_second": 6.889, "step": 63500 }, { "epoch": 1.6, "learning_rate": 0.000606587443157551, "loss": 0.0665, "step": 63510 }, { "epoch": 1.6, "learning_rate": 0.0006062105871416728, "loss": 0.069, "step": 63520 }, { "epoch": 1.6, "learning_rate": 0.0006058337311257945, "loss": 0.0634, "step": 63530 }, { "epoch": 1.6, "learning_rate": 0.0006054568751099163, "loss": 0.0679, "step": 63540 }, { "epoch": 1.6, "learning_rate": 0.0006050800190940381, "loss": 0.0672, "step": 63550 }, { "epoch": 1.6, "learning_rate": 0.00060470316307816, "loss": 0.0651, "step": 63560 }, { "epoch": 1.6, "learning_rate": 0.0006043263070622817, "loss": 0.0625, "step": 63570 }, { "epoch": 1.6, "learning_rate": 0.0006039494510464036, "loss": 0.0644, "step": 63580 }, { "epoch": 1.6, "learning_rate": 0.0006035725950305253, "loss": 0.065, "step": 63590 }, { "epoch": 1.6, "learning_rate": 0.0006031957390146472, "loss": 0.0662, "step": 63600 }, { "epoch": 1.6, "learning_rate": 0.0006028188829987689, "loss": 0.0648, "step": 63610 }, { "epoch": 1.6, "learning_rate": 0.0006024420269828908, "loss": 0.0689, "step": 63620 }, { "epoch": 1.6, "learning_rate": 0.0006020651709670125, "loss": 0.0633, "step": 63630 }, { "epoch": 1.6, "learning_rate": 0.0006016883149511344, "loss": 0.0662, "step": 63640 }, { "epoch": 1.6, "learning_rate": 0.0006013114589352561, "loss": 0.0696, "step": 63650 }, { "epoch": 1.6, "learning_rate": 0.000600934602919378, "loss": 0.0647, "step": 63660 }, { "epoch": 1.6, "learning_rate": 0.0006005577469034998, "loss": 0.0669, "step": 63670 }, { "epoch": 1.6, "learning_rate": 0.0006001808908876216, "loss": 0.0628, "step": 63680 }, { "epoch": 1.6, "learning_rate": 0.0005998040348717434, "loss": 0.0649, "step": 63690 }, { "epoch": 1.6, "learning_rate": 0.0005994271788558652, "loss": 0.0676, "step": 63700 }, { "epoch": 1.6, "learning_rate": 0.000599050322839987, "loss": 0.0674, "step": 63710 }, { "epoch": 1.6, "learning_rate": 0.0005986734668241088, "loss": 0.0672, "step": 63720 }, { "epoch": 1.6, "learning_rate": 0.0005982966108082306, "loss": 0.0637, "step": 63730 }, { "epoch": 1.6, "learning_rate": 0.0005979197547923524, "loss": 0.0671, "step": 63740 }, { "epoch": 1.6, "learning_rate": 0.0005975428987764741, "loss": 0.0642, "step": 63750 }, { "epoch": 1.6, "learning_rate": 0.000597166042760596, "loss": 0.0694, "step": 63760 }, { "epoch": 1.6, "learning_rate": 0.0005967891867447177, "loss": 0.068, "step": 63770 }, { "epoch": 1.6, "learning_rate": 0.0005964123307288395, "loss": 0.0648, "step": 63780 }, { "epoch": 1.6, "learning_rate": 0.0005960354747129613, "loss": 0.0637, "step": 63790 }, { "epoch": 1.6, "learning_rate": 0.0005956586186970831, "loss": 0.0667, "step": 63800 }, { "epoch": 1.6, "learning_rate": 0.0005952817626812049, "loss": 0.0638, "step": 63810 }, { "epoch": 1.6, "learning_rate": 0.0005949049066653267, "loss": 0.0678, "step": 63820 }, { "epoch": 1.6, "learning_rate": 0.0005945280506494485, "loss": 0.0645, "step": 63830 }, { "epoch": 1.6, "learning_rate": 0.0005941511946335703, "loss": 0.0645, "step": 63840 }, { "epoch": 1.6, "learning_rate": 0.0005937743386176922, "loss": 0.0652, "step": 63850 }, { "epoch": 1.6, "learning_rate": 0.0005933974826018139, "loss": 0.0653, "step": 63860 }, { "epoch": 1.6, "learning_rate": 0.0005930206265859358, "loss": 0.0644, "step": 63870 }, { "epoch": 1.6, "learning_rate": 0.0005926437705700575, "loss": 0.0653, "step": 63880 }, { "epoch": 1.61, "learning_rate": 0.0005922669145541794, "loss": 0.0655, "step": 63890 }, { "epoch": 1.61, "learning_rate": 0.0005918900585383011, "loss": 0.0626, "step": 63900 }, { "epoch": 1.61, "learning_rate": 0.000591513202522423, "loss": 0.0648, "step": 63910 }, { "epoch": 1.61, "learning_rate": 0.0005911363465065447, "loss": 0.0666, "step": 63920 }, { "epoch": 1.61, "learning_rate": 0.0005907594904906666, "loss": 0.064, "step": 63930 }, { "epoch": 1.61, "learning_rate": 0.0005903826344747883, "loss": 0.0659, "step": 63940 }, { "epoch": 1.61, "learning_rate": 0.0005900057784589102, "loss": 0.0617, "step": 63950 }, { "epoch": 1.61, "learning_rate": 0.000589628922443032, "loss": 0.0635, "step": 63960 }, { "epoch": 1.61, "learning_rate": 0.0005892520664271537, "loss": 0.0669, "step": 63970 }, { "epoch": 1.61, "learning_rate": 0.0005888752104112755, "loss": 0.0678, "step": 63980 }, { "epoch": 1.61, "learning_rate": 0.0005884983543953973, "loss": 0.0632, "step": 63990 }, { "epoch": 1.61, "learning_rate": 0.0005881214983795191, "loss": 0.0633, "step": 64000 }, { "epoch": 1.61, "eval_cer": 0.6652961226790862, "eval_loss": 0.05655200034379959, "eval_runtime": 90.5197, "eval_samples_per_second": 110.462, "eval_steps_per_second": 6.905, "step": 64000 }, { "epoch": 1.61, "learning_rate": 0.0005877446423636409, "loss": 0.0661, "step": 64010 }, { "epoch": 1.61, "learning_rate": 0.0005873677863477627, "loss": 0.063, "step": 64020 }, { "epoch": 1.61, "learning_rate": 0.0005869909303318846, "loss": 0.0653, "step": 64030 }, { "epoch": 1.61, "learning_rate": 0.0005866140743160063, "loss": 0.0647, "step": 64040 }, { "epoch": 1.61, "learning_rate": 0.0005862372183001282, "loss": 0.0686, "step": 64050 }, { "epoch": 1.61, "learning_rate": 0.0005858603622842499, "loss": 0.0668, "step": 64060 }, { "epoch": 1.61, "learning_rate": 0.0005854835062683718, "loss": 0.066, "step": 64070 }, { "epoch": 1.61, "learning_rate": 0.0005851066502524935, "loss": 0.0656, "step": 64080 }, { "epoch": 1.61, "learning_rate": 0.0005847297942366154, "loss": 0.0696, "step": 64090 }, { "epoch": 1.61, "learning_rate": 0.0005843529382207371, "loss": 0.068, "step": 64100 }, { "epoch": 1.61, "learning_rate": 0.000583976082204859, "loss": 0.065, "step": 64110 }, { "epoch": 1.61, "learning_rate": 0.0005835992261889807, "loss": 0.0653, "step": 64120 }, { "epoch": 1.61, "learning_rate": 0.0005832223701731026, "loss": 0.0636, "step": 64130 }, { "epoch": 1.61, "learning_rate": 0.0005828455141572244, "loss": 0.0648, "step": 64140 }, { "epoch": 1.61, "learning_rate": 0.0005824686581413462, "loss": 0.0673, "step": 64150 }, { "epoch": 1.61, "learning_rate": 0.000582091802125468, "loss": 0.0669, "step": 64160 }, { "epoch": 1.61, "learning_rate": 0.0005817149461095898, "loss": 0.068, "step": 64170 }, { "epoch": 1.61, "learning_rate": 0.0005813380900937116, "loss": 0.0673, "step": 64180 }, { "epoch": 1.61, "learning_rate": 0.0005809612340778334, "loss": 0.0646, "step": 64190 }, { "epoch": 1.61, "learning_rate": 0.0005805843780619551, "loss": 0.0648, "step": 64200 }, { "epoch": 1.61, "learning_rate": 0.000580207522046077, "loss": 0.0657, "step": 64210 }, { "epoch": 1.61, "learning_rate": 0.0005798306660301987, "loss": 0.0656, "step": 64220 }, { "epoch": 1.61, "learning_rate": 0.0005794538100143205, "loss": 0.068, "step": 64230 }, { "epoch": 1.61, "learning_rate": 0.0005790769539984423, "loss": 0.0678, "step": 64240 }, { "epoch": 1.61, "learning_rate": 0.0005787000979825641, "loss": 0.0629, "step": 64250 }, { "epoch": 1.61, "learning_rate": 0.0005783232419666859, "loss": 0.0649, "step": 64260 }, { "epoch": 1.61, "learning_rate": 0.0005779463859508077, "loss": 0.0661, "step": 64270 }, { "epoch": 1.61, "learning_rate": 0.0005775695299349295, "loss": 0.0647, "step": 64280 }, { "epoch": 1.62, "learning_rate": 0.0005771926739190513, "loss": 0.0655, "step": 64290 }, { "epoch": 1.62, "learning_rate": 0.0005768158179031732, "loss": 0.0672, "step": 64300 }, { "epoch": 1.62, "learning_rate": 0.0005764389618872949, "loss": 0.064, "step": 64310 }, { "epoch": 1.62, "learning_rate": 0.0005760621058714168, "loss": 0.0671, "step": 64320 }, { "epoch": 1.62, "learning_rate": 0.0005756852498555385, "loss": 0.0636, "step": 64330 }, { "epoch": 1.62, "learning_rate": 0.0005753083938396604, "loss": 0.0665, "step": 64340 }, { "epoch": 1.62, "learning_rate": 0.0005749315378237821, "loss": 0.066, "step": 64350 }, { "epoch": 1.62, "learning_rate": 0.000574554681807904, "loss": 0.0613, "step": 64360 }, { "epoch": 1.62, "learning_rate": 0.0005741778257920257, "loss": 0.0641, "step": 64370 }, { "epoch": 1.62, "learning_rate": 0.0005738009697761476, "loss": 0.0628, "step": 64380 }, { "epoch": 1.62, "learning_rate": 0.0005734241137602693, "loss": 0.0681, "step": 64390 }, { "epoch": 1.62, "learning_rate": 0.0005730472577443912, "loss": 0.0676, "step": 64400 }, { "epoch": 1.62, "learning_rate": 0.0005726704017285129, "loss": 0.0678, "step": 64410 }, { "epoch": 1.62, "learning_rate": 0.0005722935457126347, "loss": 0.0646, "step": 64420 }, { "epoch": 1.62, "learning_rate": 0.0005719166896967565, "loss": 0.0644, "step": 64430 }, { "epoch": 1.62, "learning_rate": 0.0005715398336808783, "loss": 0.0644, "step": 64440 }, { "epoch": 1.62, "learning_rate": 0.0005711629776650001, "loss": 0.0675, "step": 64450 }, { "epoch": 1.62, "learning_rate": 0.0005707861216491219, "loss": 0.0668, "step": 64460 }, { "epoch": 1.62, "learning_rate": 0.0005704092656332437, "loss": 0.0619, "step": 64470 }, { "epoch": 1.62, "learning_rate": 0.0005700324096173656, "loss": 0.0675, "step": 64480 }, { "epoch": 1.62, "learning_rate": 0.0005696555536014873, "loss": 0.0654, "step": 64490 }, { "epoch": 1.62, "learning_rate": 0.0005692786975856092, "loss": 0.0677, "step": 64500 }, { "epoch": 1.62, "eval_cer": 0.6652701362411195, "eval_loss": 0.05630192533135414, "eval_runtime": 90.474, "eval_samples_per_second": 110.518, "eval_steps_per_second": 6.908, "step": 64500 }, { "epoch": 1.62, "learning_rate": 0.0005689018415697309, "loss": 0.064, "step": 64510 }, { "epoch": 1.62, "learning_rate": 0.0005685249855538528, "loss": 0.0656, "step": 64520 }, { "epoch": 1.62, "learning_rate": 0.0005681481295379745, "loss": 0.0626, "step": 64530 }, { "epoch": 1.62, "learning_rate": 0.0005677712735220964, "loss": 0.0626, "step": 64540 }, { "epoch": 1.62, "learning_rate": 0.0005673944175062181, "loss": 0.0692, "step": 64550 }, { "epoch": 1.62, "learning_rate": 0.00056701756149034, "loss": 0.0661, "step": 64560 }, { "epoch": 1.62, "learning_rate": 0.0005666407054744617, "loss": 0.0655, "step": 64570 }, { "epoch": 1.62, "learning_rate": 0.0005662638494585836, "loss": 0.0658, "step": 64580 }, { "epoch": 1.62, "learning_rate": 0.0005658869934427054, "loss": 0.0648, "step": 64590 }, { "epoch": 1.62, "learning_rate": 0.0005655101374268272, "loss": 0.0638, "step": 64600 }, { "epoch": 1.62, "learning_rate": 0.000565133281410949, "loss": 0.0643, "step": 64610 }, { "epoch": 1.62, "learning_rate": 0.0005647564253950708, "loss": 0.0643, "step": 64620 }, { "epoch": 1.62, "learning_rate": 0.0005643795693791926, "loss": 0.0664, "step": 64630 }, { "epoch": 1.62, "learning_rate": 0.0005640027133633142, "loss": 0.0682, "step": 64640 }, { "epoch": 1.62, "learning_rate": 0.0005636258573474361, "loss": 0.0688, "step": 64650 }, { "epoch": 1.62, "learning_rate": 0.000563249001331558, "loss": 0.0664, "step": 64660 }, { "epoch": 1.62, "learning_rate": 0.0005628721453156797, "loss": 0.0647, "step": 64670 }, { "epoch": 1.62, "learning_rate": 0.0005624952892998015, "loss": 0.0635, "step": 64680 }, { "epoch": 1.63, "learning_rate": 0.0005621184332839233, "loss": 0.0644, "step": 64690 }, { "epoch": 1.63, "learning_rate": 0.0005617415772680451, "loss": 0.0669, "step": 64700 }, { "epoch": 1.63, "learning_rate": 0.0005613647212521669, "loss": 0.0636, "step": 64710 }, { "epoch": 1.63, "learning_rate": 0.0005609878652362887, "loss": 0.0647, "step": 64720 }, { "epoch": 1.63, "learning_rate": 0.0005606110092204105, "loss": 0.0663, "step": 64730 }, { "epoch": 1.63, "learning_rate": 0.0005602341532045323, "loss": 0.0654, "step": 64740 }, { "epoch": 1.63, "learning_rate": 0.0005598572971886541, "loss": 0.0649, "step": 64750 }, { "epoch": 1.63, "learning_rate": 0.0005594804411727759, "loss": 0.0633, "step": 64760 }, { "epoch": 1.63, "learning_rate": 0.0005591035851568978, "loss": 0.0635, "step": 64770 }, { "epoch": 1.63, "learning_rate": 0.0005587267291410195, "loss": 0.0627, "step": 64780 }, { "epoch": 1.63, "learning_rate": 0.0005583498731251414, "loss": 0.064, "step": 64790 }, { "epoch": 1.63, "learning_rate": 0.0005579730171092631, "loss": 0.0653, "step": 64800 }, { "epoch": 1.63, "learning_rate": 0.000557596161093385, "loss": 0.063, "step": 64810 }, { "epoch": 1.63, "learning_rate": 0.0005572193050775067, "loss": 0.0668, "step": 64820 }, { "epoch": 1.63, "learning_rate": 0.0005568424490616286, "loss": 0.0655, "step": 64830 }, { "epoch": 1.63, "learning_rate": 0.0005564655930457503, "loss": 0.0681, "step": 64840 }, { "epoch": 1.63, "learning_rate": 0.0005560887370298722, "loss": 0.0654, "step": 64850 }, { "epoch": 1.63, "learning_rate": 0.0005557118810139939, "loss": 0.0632, "step": 64860 }, { "epoch": 1.63, "learning_rate": 0.0005553350249981157, "loss": 0.0668, "step": 64870 }, { "epoch": 1.63, "learning_rate": 0.0005549581689822375, "loss": 0.0655, "step": 64880 }, { "epoch": 1.63, "learning_rate": 0.0005545813129663593, "loss": 0.0659, "step": 64890 }, { "epoch": 1.63, "learning_rate": 0.0005542044569504811, "loss": 0.0676, "step": 64900 }, { "epoch": 1.63, "learning_rate": 0.0005538276009346029, "loss": 0.0656, "step": 64910 }, { "epoch": 1.63, "learning_rate": 0.0005534507449187247, "loss": 0.0672, "step": 64920 }, { "epoch": 1.63, "learning_rate": 0.0005530738889028465, "loss": 0.0659, "step": 64930 }, { "epoch": 1.63, "learning_rate": 0.0005526970328869683, "loss": 0.0657, "step": 64940 }, { "epoch": 1.63, "learning_rate": 0.0005523201768710902, "loss": 0.0641, "step": 64950 }, { "epoch": 1.63, "learning_rate": 0.0005519433208552119, "loss": 0.0668, "step": 64960 }, { "epoch": 1.63, "learning_rate": 0.0005515664648393338, "loss": 0.0665, "step": 64970 }, { "epoch": 1.63, "learning_rate": 0.0005511896088234555, "loss": 0.067, "step": 64980 }, { "epoch": 1.63, "learning_rate": 0.0005508127528075774, "loss": 0.0687, "step": 64990 }, { "epoch": 1.63, "learning_rate": 0.0005504358967916991, "loss": 0.0649, "step": 65000 }, { "epoch": 1.63, "eval_cer": 0.6651690778712488, "eval_loss": 0.05603507161140442, "eval_runtime": 90.44, "eval_samples_per_second": 110.559, "eval_steps_per_second": 6.911, "step": 65000 }, { "epoch": 1.63, "learning_rate": 0.000550059040775821, "loss": 0.0629, "step": 65010 }, { "epoch": 1.63, "learning_rate": 0.0005496821847599427, "loss": 0.0616, "step": 65020 }, { "epoch": 1.63, "learning_rate": 0.0005493053287440646, "loss": 0.0668, "step": 65030 }, { "epoch": 1.63, "learning_rate": 0.0005489284727281863, "loss": 0.064, "step": 65040 }, { "epoch": 1.63, "learning_rate": 0.0005485516167123082, "loss": 0.0649, "step": 65050 }, { "epoch": 1.63, "learning_rate": 0.00054817476069643, "loss": 0.065, "step": 65060 }, { "epoch": 1.63, "learning_rate": 0.0005477979046805518, "loss": 0.0659, "step": 65070 }, { "epoch": 1.64, "learning_rate": 0.0005474210486646735, "loss": 0.0644, "step": 65080 }, { "epoch": 1.64, "learning_rate": 0.0005470441926487952, "loss": 0.0645, "step": 65090 }, { "epoch": 1.64, "learning_rate": 0.0005466673366329171, "loss": 0.0669, "step": 65100 }, { "epoch": 1.64, "learning_rate": 0.0005462904806170388, "loss": 0.0662, "step": 65110 }, { "epoch": 1.64, "learning_rate": 0.0005459136246011607, "loss": 0.068, "step": 65120 }, { "epoch": 1.64, "learning_rate": 0.0005455367685852826, "loss": 0.0655, "step": 65130 }, { "epoch": 1.64, "learning_rate": 0.0005451599125694043, "loss": 0.0704, "step": 65140 }, { "epoch": 1.64, "learning_rate": 0.0005447830565535261, "loss": 0.0653, "step": 65150 }, { "epoch": 1.64, "learning_rate": 0.0005444062005376479, "loss": 0.0651, "step": 65160 }, { "epoch": 1.64, "learning_rate": 0.0005440293445217697, "loss": 0.0663, "step": 65170 }, { "epoch": 1.64, "learning_rate": 0.0005436524885058915, "loss": 0.0675, "step": 65180 }, { "epoch": 1.64, "learning_rate": 0.0005432756324900133, "loss": 0.0658, "step": 65190 }, { "epoch": 1.64, "learning_rate": 0.0005428987764741351, "loss": 0.0637, "step": 65200 }, { "epoch": 1.64, "learning_rate": 0.0005425219204582569, "loss": 0.0678, "step": 65210 }, { "epoch": 1.64, "learning_rate": 0.0005421450644423787, "loss": 0.0674, "step": 65220 }, { "epoch": 1.64, "learning_rate": 0.0005417682084265005, "loss": 0.0656, "step": 65230 }, { "epoch": 1.64, "learning_rate": 0.0005413913524106224, "loss": 0.0645, "step": 65240 }, { "epoch": 1.64, "learning_rate": 0.0005410144963947441, "loss": 0.0657, "step": 65250 }, { "epoch": 1.64, "learning_rate": 0.000540637640378866, "loss": 0.0663, "step": 65260 }, { "epoch": 1.64, "learning_rate": 0.0005402607843629877, "loss": 0.0638, "step": 65270 }, { "epoch": 1.64, "learning_rate": 0.0005398839283471096, "loss": 0.0677, "step": 65280 }, { "epoch": 1.64, "learning_rate": 0.0005395070723312313, "loss": 0.0631, "step": 65290 }, { "epoch": 1.64, "learning_rate": 0.0005391302163153532, "loss": 0.0664, "step": 65300 }, { "epoch": 1.64, "learning_rate": 0.0005387533602994749, "loss": 0.0653, "step": 65310 }, { "epoch": 1.64, "learning_rate": 0.0005383765042835967, "loss": 0.066, "step": 65320 }, { "epoch": 1.64, "learning_rate": 0.0005379996482677185, "loss": 0.0665, "step": 65330 }, { "epoch": 1.64, "learning_rate": 0.0005376227922518403, "loss": 0.0672, "step": 65340 }, { "epoch": 1.64, "learning_rate": 0.0005372459362359621, "loss": 0.0644, "step": 65350 }, { "epoch": 1.64, "learning_rate": 0.0005368690802200839, "loss": 0.0683, "step": 65360 }, { "epoch": 1.64, "learning_rate": 0.0005364922242042057, "loss": 0.0643, "step": 65370 }, { "epoch": 1.64, "learning_rate": 0.0005361153681883275, "loss": 0.066, "step": 65380 }, { "epoch": 1.64, "learning_rate": 0.0005357385121724493, "loss": 0.0647, "step": 65390 }, { "epoch": 1.64, "learning_rate": 0.0005353616561565711, "loss": 0.0621, "step": 65400 }, { "epoch": 1.64, "learning_rate": 0.0005349848001406929, "loss": 0.0645, "step": 65410 }, { "epoch": 1.64, "learning_rate": 0.0005346079441248148, "loss": 0.0677, "step": 65420 }, { "epoch": 1.64, "learning_rate": 0.0005342310881089365, "loss": 0.0653, "step": 65430 }, { "epoch": 1.64, "learning_rate": 0.0005338542320930584, "loss": 0.07, "step": 65440 }, { "epoch": 1.64, "learning_rate": 0.0005334773760771801, "loss": 0.0645, "step": 65450 }, { "epoch": 1.64, "learning_rate": 0.000533100520061302, "loss": 0.0657, "step": 65460 }, { "epoch": 1.64, "learning_rate": 0.0005327236640454237, "loss": 0.0654, "step": 65470 }, { "epoch": 1.65, "learning_rate": 0.0005323468080295456, "loss": 0.0639, "step": 65480 }, { "epoch": 1.65, "learning_rate": 0.0005319699520136673, "loss": 0.0633, "step": 65490 }, { "epoch": 1.65, "learning_rate": 0.0005315930959977892, "loss": 0.0654, "step": 65500 }, { "epoch": 1.65, "eval_cer": 0.6653707133806576, "eval_loss": 0.0557679682970047, "eval_runtime": 90.7481, "eval_samples_per_second": 110.184, "eval_steps_per_second": 6.887, "step": 65500 }, { "epoch": 1.65, "learning_rate": 0.0005312162399819109, "loss": 0.0639, "step": 65510 }, { "epoch": 1.65, "learning_rate": 0.0005308393839660328, "loss": 0.0685, "step": 65520 }, { "epoch": 1.65, "learning_rate": 0.0005304625279501545, "loss": 0.0661, "step": 65530 }, { "epoch": 1.65, "learning_rate": 0.0005300856719342762, "loss": 0.066, "step": 65540 }, { "epoch": 1.65, "learning_rate": 0.0005297088159183981, "loss": 0.0622, "step": 65550 }, { "epoch": 1.65, "learning_rate": 0.0005293319599025198, "loss": 0.0649, "step": 65560 }, { "epoch": 1.65, "learning_rate": 0.0005289551038866417, "loss": 0.0658, "step": 65570 }, { "epoch": 1.65, "learning_rate": 0.0005285782478707636, "loss": 0.0627, "step": 65580 }, { "epoch": 1.65, "learning_rate": 0.0005282013918548853, "loss": 0.0638, "step": 65590 }, { "epoch": 1.65, "learning_rate": 0.0005278245358390072, "loss": 0.0647, "step": 65600 }, { "epoch": 1.65, "learning_rate": 0.0005274476798231289, "loss": 0.0678, "step": 65610 }, { "epoch": 1.65, "learning_rate": 0.0005270708238072507, "loss": 0.0658, "step": 65620 }, { "epoch": 1.65, "learning_rate": 0.0005266939677913725, "loss": 0.066, "step": 65630 }, { "epoch": 1.65, "learning_rate": 0.0005263171117754943, "loss": 0.0658, "step": 65640 }, { "epoch": 1.65, "learning_rate": 0.0005259402557596161, "loss": 0.0644, "step": 65650 }, { "epoch": 1.65, "learning_rate": 0.0005255633997437379, "loss": 0.0633, "step": 65660 }, { "epoch": 1.65, "learning_rate": 0.0005251865437278597, "loss": 0.0645, "step": 65670 }, { "epoch": 1.65, "learning_rate": 0.0005248096877119815, "loss": 0.0627, "step": 65680 }, { "epoch": 1.65, "learning_rate": 0.0005244328316961034, "loss": 0.0643, "step": 65690 }, { "epoch": 1.65, "learning_rate": 0.0005240559756802251, "loss": 0.064, "step": 65700 }, { "epoch": 1.65, "learning_rate": 0.000523679119664347, "loss": 0.0699, "step": 65710 }, { "epoch": 1.65, "learning_rate": 0.0005233022636484687, "loss": 0.0665, "step": 65720 }, { "epoch": 1.65, "learning_rate": 0.0005229254076325906, "loss": 0.0674, "step": 65730 }, { "epoch": 1.65, "learning_rate": 0.0005225485516167123, "loss": 0.0638, "step": 65740 }, { "epoch": 1.65, "learning_rate": 0.0005221716956008341, "loss": 0.0632, "step": 65750 }, { "epoch": 1.65, "learning_rate": 0.0005217948395849559, "loss": 0.0636, "step": 65760 }, { "epoch": 1.65, "learning_rate": 0.0005214179835690777, "loss": 0.066, "step": 65770 }, { "epoch": 1.65, "learning_rate": 0.0005210411275531995, "loss": 0.0657, "step": 65780 }, { "epoch": 1.65, "learning_rate": 0.0005206642715373213, "loss": 0.0628, "step": 65790 }, { "epoch": 1.65, "learning_rate": 0.0005202874155214431, "loss": 0.0642, "step": 65800 }, { "epoch": 1.65, "learning_rate": 0.0005199105595055649, "loss": 0.0656, "step": 65810 }, { "epoch": 1.65, "learning_rate": 0.0005195337034896867, "loss": 0.0672, "step": 65820 }, { "epoch": 1.65, "learning_rate": 0.0005191568474738085, "loss": 0.0685, "step": 65830 }, { "epoch": 1.65, "learning_rate": 0.0005187799914579303, "loss": 0.0626, "step": 65840 }, { "epoch": 1.65, "learning_rate": 0.0005184031354420521, "loss": 0.0654, "step": 65850 }, { "epoch": 1.65, "learning_rate": 0.0005180262794261739, "loss": 0.0644, "step": 65860 }, { "epoch": 1.65, "learning_rate": 0.0005176494234102958, "loss": 0.0666, "step": 65870 }, { "epoch": 1.66, "learning_rate": 0.0005172725673944175, "loss": 0.0637, "step": 65880 }, { "epoch": 1.66, "learning_rate": 0.0005168957113785394, "loss": 0.0681, "step": 65890 }, { "epoch": 1.66, "learning_rate": 0.0005165188553626611, "loss": 0.0655, "step": 65900 }, { "epoch": 1.66, "learning_rate": 0.000516141999346783, "loss": 0.065, "step": 65910 }, { "epoch": 1.66, "learning_rate": 0.0005157651433309047, "loss": 0.0626, "step": 65920 }, { "epoch": 1.66, "learning_rate": 0.0005153882873150266, "loss": 0.066, "step": 65930 }, { "epoch": 1.66, "learning_rate": 0.0005150114312991483, "loss": 0.066, "step": 65940 }, { "epoch": 1.66, "learning_rate": 0.0005146345752832702, "loss": 0.0675, "step": 65950 }, { "epoch": 1.66, "learning_rate": 0.0005142577192673919, "loss": 0.0637, "step": 65960 }, { "epoch": 1.66, "learning_rate": 0.0005138808632515137, "loss": 0.0619, "step": 65970 }, { "epoch": 1.66, "learning_rate": 0.0005135040072356355, "loss": 0.0646, "step": 65980 }, { "epoch": 1.66, "learning_rate": 0.0005131271512197573, "loss": 0.0666, "step": 65990 }, { "epoch": 1.66, "learning_rate": 0.0005127502952038791, "loss": 0.0675, "step": 66000 }, { "epoch": 1.66, "eval_cer": 0.6653572389313415, "eval_loss": 0.055686622858047485, "eval_runtime": 90.4669, "eval_samples_per_second": 110.527, "eval_steps_per_second": 6.909, "step": 66000 }, { "epoch": 1.66, "learning_rate": 0.0005123734391880008, "loss": 0.0614, "step": 66010 }, { "epoch": 1.66, "learning_rate": 0.0005119965831721227, "loss": 0.06, "step": 66020 }, { "epoch": 1.66, "learning_rate": 0.0005116197271562444, "loss": 0.066, "step": 66030 }, { "epoch": 1.66, "learning_rate": 0.0005112428711403663, "loss": 0.0651, "step": 66040 }, { "epoch": 1.66, "learning_rate": 0.0005108660151244882, "loss": 0.0605, "step": 66050 }, { "epoch": 1.66, "learning_rate": 0.0005104891591086099, "loss": 0.066, "step": 66060 }, { "epoch": 1.66, "learning_rate": 0.0005101123030927318, "loss": 0.0629, "step": 66070 }, { "epoch": 1.66, "learning_rate": 0.0005097354470768535, "loss": 0.0677, "step": 66080 }, { "epoch": 1.66, "learning_rate": 0.0005093585910609753, "loss": 0.0661, "step": 66090 }, { "epoch": 1.66, "learning_rate": 0.0005089817350450971, "loss": 0.0614, "step": 66100 }, { "epoch": 1.66, "learning_rate": 0.000508604879029219, "loss": 0.065, "step": 66110 }, { "epoch": 1.66, "learning_rate": 0.0005082280230133407, "loss": 0.066, "step": 66120 }, { "epoch": 1.66, "learning_rate": 0.0005078511669974625, "loss": 0.0661, "step": 66130 }, { "epoch": 1.66, "learning_rate": 0.0005074743109815843, "loss": 0.0672, "step": 66140 }, { "epoch": 1.66, "learning_rate": 0.0005070974549657061, "loss": 0.0624, "step": 66150 }, { "epoch": 1.66, "learning_rate": 0.000506720598949828, "loss": 0.0657, "step": 66160 }, { "epoch": 1.66, "learning_rate": 0.0005063437429339497, "loss": 0.0635, "step": 66170 }, { "epoch": 1.66, "learning_rate": 0.0005059668869180716, "loss": 0.0648, "step": 66180 }, { "epoch": 1.66, "learning_rate": 0.0005055900309021933, "loss": 0.0635, "step": 66190 }, { "epoch": 1.66, "learning_rate": 0.0005052131748863151, "loss": 0.0688, "step": 66200 }, { "epoch": 1.66, "learning_rate": 0.0005048363188704368, "loss": 0.0642, "step": 66210 }, { "epoch": 1.66, "learning_rate": 0.0005044594628545587, "loss": 0.0639, "step": 66220 }, { "epoch": 1.66, "learning_rate": 0.0005040826068386805, "loss": 0.0654, "step": 66230 }, { "epoch": 1.66, "learning_rate": 0.0005037057508228023, "loss": 0.0638, "step": 66240 }, { "epoch": 1.66, "learning_rate": 0.0005033288948069241, "loss": 0.0643, "step": 66250 }, { "epoch": 1.66, "learning_rate": 0.0005029520387910459, "loss": 0.0629, "step": 66260 }, { "epoch": 1.66, "learning_rate": 0.0005025751827751677, "loss": 0.0676, "step": 66270 }, { "epoch": 1.67, "learning_rate": 0.0005021983267592895, "loss": 0.0636, "step": 66280 }, { "epoch": 1.67, "learning_rate": 0.0005018214707434113, "loss": 0.064, "step": 66290 }, { "epoch": 1.67, "learning_rate": 0.0005014446147275331, "loss": 0.0663, "step": 66300 }, { "epoch": 1.67, "learning_rate": 0.0005010677587116549, "loss": 0.0632, "step": 66310 }, { "epoch": 1.67, "learning_rate": 0.0005006909026957767, "loss": 0.0647, "step": 66320 }, { "epoch": 1.67, "learning_rate": 0.0005003140466798985, "loss": 0.0668, "step": 66330 }, { "epoch": 1.67, "learning_rate": 0.0004999371906640204, "loss": 0.063, "step": 66340 }, { "epoch": 1.67, "learning_rate": 0.0004995603346481421, "loss": 0.0659, "step": 66350 }, { "epoch": 1.67, "learning_rate": 0.000499183478632264, "loss": 0.0625, "step": 66360 }, { "epoch": 1.67, "learning_rate": 0.0004988066226163857, "loss": 0.0643, "step": 66370 }, { "epoch": 1.67, "learning_rate": 0.0004984297666005076, "loss": 0.0633, "step": 66380 }, { "epoch": 1.67, "learning_rate": 0.0004980529105846293, "loss": 0.0624, "step": 66390 }, { "epoch": 1.67, "learning_rate": 0.0004976760545687512, "loss": 0.0631, "step": 66400 }, { "epoch": 1.67, "learning_rate": 0.0004972991985528729, "loss": 0.0695, "step": 66410 }, { "epoch": 1.67, "learning_rate": 0.0004969223425369947, "loss": 0.0637, "step": 66420 }, { "epoch": 1.67, "learning_rate": 0.0004965454865211165, "loss": 0.0675, "step": 66430 }, { "epoch": 1.67, "learning_rate": 0.0004961686305052383, "loss": 0.0655, "step": 66440 }, { "epoch": 1.67, "learning_rate": 0.0004957917744893601, "loss": 0.0669, "step": 66450 }, { "epoch": 1.67, "learning_rate": 0.0004954149184734819, "loss": 0.0624, "step": 66460 }, { "epoch": 1.67, "learning_rate": 0.0004950380624576037, "loss": 0.0642, "step": 66470 }, { "epoch": 1.67, "learning_rate": 0.0004946612064417254, "loss": 0.0632, "step": 66480 }, { "epoch": 1.67, "learning_rate": 0.0004942843504258473, "loss": 0.062, "step": 66490 }, { "epoch": 1.67, "learning_rate": 0.000493907494409969, "loss": 0.0642, "step": 66500 }, { "epoch": 1.67, "eval_cer": 0.6652633990164615, "eval_loss": 0.05538139119744301, "eval_runtime": 90.5902, "eval_samples_per_second": 110.376, "eval_steps_per_second": 6.899, "step": 66500 }, { "epoch": 1.67, "learning_rate": 0.0004935306383940909, "loss": 0.0635, "step": 66510 }, { "epoch": 1.67, "learning_rate": 0.0004931537823782128, "loss": 0.0623, "step": 66520 }, { "epoch": 1.67, "learning_rate": 0.0004927769263623345, "loss": 0.0643, "step": 66530 }, { "epoch": 1.67, "learning_rate": 0.0004924000703464564, "loss": 0.0654, "step": 66540 }, { "epoch": 1.67, "learning_rate": 0.0004920232143305781, "loss": 0.0633, "step": 66550 }, { "epoch": 1.67, "learning_rate": 0.0004916463583147, "loss": 0.0623, "step": 66560 }, { "epoch": 1.67, "learning_rate": 0.0004912695022988217, "loss": 0.0653, "step": 66570 }, { "epoch": 1.67, "learning_rate": 0.0004908926462829435, "loss": 0.0664, "step": 66580 }, { "epoch": 1.67, "learning_rate": 0.0004905157902670653, "loss": 0.0634, "step": 66590 }, { "epoch": 1.67, "learning_rate": 0.0004901389342511871, "loss": 0.0645, "step": 66600 }, { "epoch": 1.67, "learning_rate": 0.0004897620782353089, "loss": 0.0648, "step": 66610 }, { "epoch": 1.67, "learning_rate": 0.0004893852222194307, "loss": 0.0649, "step": 66620 }, { "epoch": 1.67, "learning_rate": 0.0004890083662035526, "loss": 0.0646, "step": 66630 }, { "epoch": 1.67, "learning_rate": 0.0004886315101876742, "loss": 0.0655, "step": 66640 }, { "epoch": 1.67, "learning_rate": 0.0004882546541717961, "loss": 0.068, "step": 66650 }, { "epoch": 1.67, "learning_rate": 0.0004878777981559179, "loss": 0.0673, "step": 66660 }, { "epoch": 1.67, "learning_rate": 0.0004875009421400397, "loss": 0.0641, "step": 66670 }, { "epoch": 1.68, "learning_rate": 0.0004871240861241615, "loss": 0.0661, "step": 66680 }, { "epoch": 1.68, "learning_rate": 0.0004867472301082833, "loss": 0.0666, "step": 66690 }, { "epoch": 1.68, "learning_rate": 0.0004863703740924051, "loss": 0.0673, "step": 66700 }, { "epoch": 1.68, "learning_rate": 0.0004859935180765269, "loss": 0.0659, "step": 66710 }, { "epoch": 1.68, "learning_rate": 0.0004856166620606487, "loss": 0.0659, "step": 66720 }, { "epoch": 1.68, "learning_rate": 0.0004852398060447705, "loss": 0.0659, "step": 66730 }, { "epoch": 1.68, "learning_rate": 0.0004848629500288923, "loss": 0.0636, "step": 66740 }, { "epoch": 1.68, "learning_rate": 0.0004844860940130141, "loss": 0.0669, "step": 66750 }, { "epoch": 1.68, "learning_rate": 0.0004841092379971359, "loss": 0.0649, "step": 66760 }, { "epoch": 1.68, "learning_rate": 0.0004837323819812577, "loss": 0.0637, "step": 66770 }, { "epoch": 1.68, "learning_rate": 0.0004833555259653795, "loss": 0.0647, "step": 66780 }, { "epoch": 1.68, "learning_rate": 0.0004829786699495013, "loss": 0.0651, "step": 66790 }, { "epoch": 1.68, "learning_rate": 0.0004826018139336231, "loss": 0.0656, "step": 66800 }, { "epoch": 1.68, "learning_rate": 0.0004822249579177449, "loss": 0.0657, "step": 66810 }, { "epoch": 1.68, "learning_rate": 0.0004818481019018667, "loss": 0.0638, "step": 66820 }, { "epoch": 1.68, "learning_rate": 0.0004814712458859885, "loss": 0.0625, "step": 66830 }, { "epoch": 1.68, "learning_rate": 0.0004810943898701103, "loss": 0.0637, "step": 66840 }, { "epoch": 1.68, "learning_rate": 0.00048071753385423217, "loss": 0.0656, "step": 66850 }, { "epoch": 1.68, "learning_rate": 0.00048034067783835386, "loss": 0.0632, "step": 66860 }, { "epoch": 1.68, "learning_rate": 0.00047996382182247566, "loss": 0.0643, "step": 66870 }, { "epoch": 1.68, "learning_rate": 0.00047958696580659746, "loss": 0.0636, "step": 66880 }, { "epoch": 1.68, "learning_rate": 0.00047921010979071926, "loss": 0.0649, "step": 66890 }, { "epoch": 1.68, "learning_rate": 0.00047883325377484105, "loss": 0.0657, "step": 66900 }, { "epoch": 1.68, "learning_rate": 0.0004784563977589629, "loss": 0.0675, "step": 66910 }, { "epoch": 1.68, "learning_rate": 0.0004780795417430847, "loss": 0.0676, "step": 66920 }, { "epoch": 1.68, "learning_rate": 0.0004777026857272065, "loss": 0.0649, "step": 66930 }, { "epoch": 1.68, "learning_rate": 0.0004773258297113283, "loss": 0.0616, "step": 66940 }, { "epoch": 1.68, "learning_rate": 0.0004769489736954501, "loss": 0.0631, "step": 66950 }, { "epoch": 1.68, "learning_rate": 0.0004765721176795719, "loss": 0.0618, "step": 66960 }, { "epoch": 1.68, "learning_rate": 0.0004761952616636937, "loss": 0.0641, "step": 66970 }, { "epoch": 1.68, "learning_rate": 0.0004758184056478155, "loss": 0.0636, "step": 66980 }, { "epoch": 1.68, "learning_rate": 0.0004754415496319373, "loss": 0.0654, "step": 66990 }, { "epoch": 1.68, "learning_rate": 0.0004750646936160591, "loss": 0.0631, "step": 67000 }, { "epoch": 1.68, "eval_cer": 0.6653168155833932, "eval_loss": 0.055216867476701736, "eval_runtime": 90.7608, "eval_samples_per_second": 110.169, "eval_steps_per_second": 6.886, "step": 67000 }, { "epoch": 1.68, "learning_rate": 0.0004746878376001809, "loss": 0.0644, "step": 67010 }, { "epoch": 1.68, "learning_rate": 0.0004743109815843027, "loss": 0.0647, "step": 67020 }, { "epoch": 1.68, "learning_rate": 0.00047393412556842455, "loss": 0.0632, "step": 67030 }, { "epoch": 1.68, "learning_rate": 0.00047355726955254635, "loss": 0.062, "step": 67040 }, { "epoch": 1.68, "learning_rate": 0.00047318041353666815, "loss": 0.0641, "step": 67050 }, { "epoch": 1.68, "learning_rate": 0.00047280355752078994, "loss": 0.0653, "step": 67060 }, { "epoch": 1.69, "learning_rate": 0.00047242670150491174, "loss": 0.0645, "step": 67070 }, { "epoch": 1.69, "learning_rate": 0.00047204984548903343, "loss": 0.0645, "step": 67080 }, { "epoch": 1.69, "learning_rate": 0.0004716729894731553, "loss": 0.0659, "step": 67090 }, { "epoch": 1.69, "learning_rate": 0.0004712961334572771, "loss": 0.0632, "step": 67100 }, { "epoch": 1.69, "learning_rate": 0.0004709192774413989, "loss": 0.0632, "step": 67110 }, { "epoch": 1.69, "learning_rate": 0.0004705424214255207, "loss": 0.0652, "step": 67120 }, { "epoch": 1.69, "learning_rate": 0.0004701655654096425, "loss": 0.0635, "step": 67130 }, { "epoch": 1.69, "learning_rate": 0.0004697887093937643, "loss": 0.0662, "step": 67140 }, { "epoch": 1.69, "learning_rate": 0.0004694118533778861, "loss": 0.0637, "step": 67150 }, { "epoch": 1.69, "learning_rate": 0.0004690349973620079, "loss": 0.0631, "step": 67160 }, { "epoch": 1.69, "learning_rate": 0.0004686581413461297, "loss": 0.0635, "step": 67170 }, { "epoch": 1.69, "learning_rate": 0.0004682812853302515, "loss": 0.0649, "step": 67180 }, { "epoch": 1.69, "learning_rate": 0.0004679044293143733, "loss": 0.0615, "step": 67190 }, { "epoch": 1.69, "learning_rate": 0.00046752757329849513, "loss": 0.0638, "step": 67200 }, { "epoch": 1.69, "learning_rate": 0.0004671507172826169, "loss": 0.0635, "step": 67210 }, { "epoch": 1.69, "learning_rate": 0.0004667738612667387, "loss": 0.0627, "step": 67220 }, { "epoch": 1.69, "learning_rate": 0.0004663970052508605, "loss": 0.0625, "step": 67230 }, { "epoch": 1.69, "learning_rate": 0.0004660201492349823, "loss": 0.065, "step": 67240 }, { "epoch": 1.69, "learning_rate": 0.0004656432932191041, "loss": 0.0622, "step": 67250 }, { "epoch": 1.69, "learning_rate": 0.0004652664372032259, "loss": 0.061, "step": 67260 }, { "epoch": 1.69, "learning_rate": 0.0004648895811873477, "loss": 0.0652, "step": 67270 }, { "epoch": 1.69, "learning_rate": 0.0004645127251714695, "loss": 0.0642, "step": 67280 }, { "epoch": 1.69, "learning_rate": 0.0004641358691555913, "loss": 0.0662, "step": 67290 }, { "epoch": 1.69, "learning_rate": 0.0004637590131397131, "loss": 0.0655, "step": 67300 }, { "epoch": 1.69, "learning_rate": 0.00046338215712383486, "loss": 0.0635, "step": 67310 }, { "epoch": 1.69, "learning_rate": 0.00046300530110795666, "loss": 0.0662, "step": 67320 }, { "epoch": 1.69, "learning_rate": 0.00046262844509207846, "loss": 0.065, "step": 67330 }, { "epoch": 1.69, "learning_rate": 0.00046225158907620026, "loss": 0.0637, "step": 67340 }, { "epoch": 1.69, "learning_rate": 0.00046187473306032206, "loss": 0.0661, "step": 67350 }, { "epoch": 1.69, "learning_rate": 0.00046149787704444385, "loss": 0.0652, "step": 67360 }, { "epoch": 1.69, "learning_rate": 0.00046112102102856565, "loss": 0.0644, "step": 67370 }, { "epoch": 1.69, "learning_rate": 0.0004607441650126875, "loss": 0.0658, "step": 67380 }, { "epoch": 1.69, "learning_rate": 0.0004603673089968093, "loss": 0.0686, "step": 67390 }, { "epoch": 1.69, "learning_rate": 0.0004599904529809311, "loss": 0.065, "step": 67400 }, { "epoch": 1.69, "learning_rate": 0.0004596135969650529, "loss": 0.0682, "step": 67410 }, { "epoch": 1.69, "learning_rate": 0.0004592367409491747, "loss": 0.063, "step": 67420 }, { "epoch": 1.69, "learning_rate": 0.0004588598849332965, "loss": 0.0654, "step": 67430 }, { "epoch": 1.69, "learning_rate": 0.0004584830289174183, "loss": 0.0643, "step": 67440 }, { "epoch": 1.69, "learning_rate": 0.0004581061729015401, "loss": 0.0652, "step": 67450 }, { "epoch": 1.69, "learning_rate": 0.0004577293168856619, "loss": 0.0653, "step": 67460 }, { "epoch": 1.7, "learning_rate": 0.0004573524608697837, "loss": 0.0661, "step": 67470 }, { "epoch": 1.7, "learning_rate": 0.0004569756048539055, "loss": 0.0639, "step": 67480 }, { "epoch": 1.7, "learning_rate": 0.00045659874883802735, "loss": 0.0663, "step": 67490 }, { "epoch": 1.7, "learning_rate": 0.00045622189282214915, "loss": 0.0628, "step": 67500 }, { "epoch": 1.7, "eval_cer": 0.6652359688874965, "eval_loss": 0.05516913905739784, "eval_runtime": 90.7509, "eval_samples_per_second": 110.181, "eval_steps_per_second": 6.887, "step": 67500 }, { "epoch": 1.7, "learning_rate": 0.00045584503680627095, "loss": 0.0653, "step": 67510 }, { "epoch": 1.7, "learning_rate": 0.00045546818079039274, "loss": 0.0623, "step": 67520 }, { "epoch": 1.7, "learning_rate": 0.00045509132477451443, "loss": 0.0636, "step": 67530 }, { "epoch": 1.7, "learning_rate": 0.00045471446875863623, "loss": 0.0632, "step": 67540 }, { "epoch": 1.7, "learning_rate": 0.0004543376127427581, "loss": 0.0632, "step": 67550 }, { "epoch": 1.7, "learning_rate": 0.0004539607567268799, "loss": 0.0662, "step": 67560 }, { "epoch": 1.7, "learning_rate": 0.0004535839007110017, "loss": 0.0645, "step": 67570 }, { "epoch": 1.7, "learning_rate": 0.0004532070446951235, "loss": 0.0639, "step": 67580 }, { "epoch": 1.7, "learning_rate": 0.0004528301886792453, "loss": 0.0679, "step": 67590 }, { "epoch": 1.7, "learning_rate": 0.0004524533326633671, "loss": 0.0674, "step": 67600 }, { "epoch": 1.7, "learning_rate": 0.0004520764766474889, "loss": 0.0624, "step": 67610 }, { "epoch": 1.7, "learning_rate": 0.0004516996206316107, "loss": 0.0614, "step": 67620 }, { "epoch": 1.7, "learning_rate": 0.0004513227646157325, "loss": 0.062, "step": 67630 }, { "epoch": 1.7, "learning_rate": 0.0004509459085998543, "loss": 0.0642, "step": 67640 }, { "epoch": 1.7, "learning_rate": 0.0004505690525839761, "loss": 0.0649, "step": 67650 }, { "epoch": 1.7, "learning_rate": 0.0004501921965680979, "loss": 0.0637, "step": 67660 }, { "epoch": 1.7, "learning_rate": 0.00044981534055221973, "loss": 0.0626, "step": 67670 }, { "epoch": 1.7, "learning_rate": 0.0004494384845363415, "loss": 0.0662, "step": 67680 }, { "epoch": 1.7, "learning_rate": 0.0004490616285204633, "loss": 0.0695, "step": 67690 }, { "epoch": 1.7, "learning_rate": 0.0004486847725045851, "loss": 0.066, "step": 67700 }, { "epoch": 1.7, "learning_rate": 0.0004483079164887069, "loss": 0.0671, "step": 67710 }, { "epoch": 1.7, "learning_rate": 0.0004479310604728287, "loss": 0.0642, "step": 67720 }, { "epoch": 1.7, "learning_rate": 0.0004475542044569505, "loss": 0.0618, "step": 67730 }, { "epoch": 1.7, "learning_rate": 0.0004471773484410723, "loss": 0.0681, "step": 67740 }, { "epoch": 1.7, "learning_rate": 0.00044680049242519406, "loss": 0.0649, "step": 67750 }, { "epoch": 1.7, "learning_rate": 0.00044642363640931586, "loss": 0.0679, "step": 67760 }, { "epoch": 1.7, "learning_rate": 0.00044604678039343766, "loss": 0.0629, "step": 67770 }, { "epoch": 1.7, "learning_rate": 0.00044566992437755946, "loss": 0.067, "step": 67780 }, { "epoch": 1.7, "learning_rate": 0.00044529306836168126, "loss": 0.0653, "step": 67790 }, { "epoch": 1.7, "learning_rate": 0.00044491621234580306, "loss": 0.0646, "step": 67800 }, { "epoch": 1.7, "learning_rate": 0.00044453935632992486, "loss": 0.0647, "step": 67810 }, { "epoch": 1.7, "learning_rate": 0.00044416250031404666, "loss": 0.0633, "step": 67820 }, { "epoch": 1.7, "learning_rate": 0.00044378564429816845, "loss": 0.0661, "step": 67830 }, { "epoch": 1.7, "learning_rate": 0.0004434087882822903, "loss": 0.0662, "step": 67840 }, { "epoch": 1.7, "learning_rate": 0.0004430319322664121, "loss": 0.063, "step": 67850 }, { "epoch": 1.7, "learning_rate": 0.0004426550762505339, "loss": 0.0631, "step": 67860 }, { "epoch": 1.71, "learning_rate": 0.0004422782202346557, "loss": 0.0687, "step": 67870 }, { "epoch": 1.71, "learning_rate": 0.0004419013642187775, "loss": 0.0646, "step": 67880 }, { "epoch": 1.71, "learning_rate": 0.0004415245082028993, "loss": 0.0644, "step": 67890 }, { "epoch": 1.71, "learning_rate": 0.0004411476521870211, "loss": 0.0619, "step": 67900 }, { "epoch": 1.71, "learning_rate": 0.0004407707961711429, "loss": 0.0628, "step": 67910 }, { "epoch": 1.71, "learning_rate": 0.0004403939401552647, "loss": 0.0617, "step": 67920 }, { "epoch": 1.71, "learning_rate": 0.0004400170841393865, "loss": 0.065, "step": 67930 }, { "epoch": 1.71, "learning_rate": 0.0004396402281235083, "loss": 0.0642, "step": 67940 }, { "epoch": 1.71, "learning_rate": 0.0004392633721076301, "loss": 0.0633, "step": 67950 }, { "epoch": 1.71, "learning_rate": 0.00043888651609175195, "loss": 0.063, "step": 67960 }, { "epoch": 1.71, "learning_rate": 0.00043850966007587364, "loss": 0.0654, "step": 67970 }, { "epoch": 1.71, "learning_rate": 0.00043813280405999544, "loss": 0.0636, "step": 67980 }, { "epoch": 1.71, "learning_rate": 0.00043775594804411724, "loss": 0.0649, "step": 67990 }, { "epoch": 1.71, "learning_rate": 0.00043737909202823903, "loss": 0.0658, "step": 68000 }, { "epoch": 1.71, "eval_cer": 0.6652422248818218, "eval_loss": 0.05499656870961189, "eval_runtime": 90.5701, "eval_samples_per_second": 110.401, "eval_steps_per_second": 6.901, "step": 68000 }, { "epoch": 1.71, "learning_rate": 0.00043700223601236083, "loss": 0.0656, "step": 68010 }, { "epoch": 1.71, "learning_rate": 0.0004366253799964827, "loss": 0.0626, "step": 68020 }, { "epoch": 1.71, "learning_rate": 0.0004362485239806045, "loss": 0.0635, "step": 68030 }, { "epoch": 1.71, "learning_rate": 0.0004358716679647263, "loss": 0.0634, "step": 68040 }, { "epoch": 1.71, "learning_rate": 0.0004354948119488481, "loss": 0.0625, "step": 68050 }, { "epoch": 1.71, "learning_rate": 0.0004351179559329699, "loss": 0.0659, "step": 68060 }, { "epoch": 1.71, "learning_rate": 0.0004347410999170917, "loss": 0.0648, "step": 68070 }, { "epoch": 1.71, "learning_rate": 0.0004343642439012135, "loss": 0.0658, "step": 68080 }, { "epoch": 1.71, "learning_rate": 0.0004339873878853353, "loss": 0.0642, "step": 68090 }, { "epoch": 1.71, "learning_rate": 0.0004336105318694571, "loss": 0.0599, "step": 68100 }, { "epoch": 1.71, "learning_rate": 0.0004332336758535789, "loss": 0.063, "step": 68110 }, { "epoch": 1.71, "learning_rate": 0.0004328568198377007, "loss": 0.0649, "step": 68120 }, { "epoch": 1.71, "learning_rate": 0.00043247996382182253, "loss": 0.0663, "step": 68130 }, { "epoch": 1.71, "learning_rate": 0.0004321031078059443, "loss": 0.0652, "step": 68140 }, { "epoch": 1.71, "learning_rate": 0.0004317262517900661, "loss": 0.0635, "step": 68150 }, { "epoch": 1.71, "learning_rate": 0.0004313493957741879, "loss": 0.0666, "step": 68160 }, { "epoch": 1.71, "learning_rate": 0.0004309725397583097, "loss": 0.0679, "step": 68170 }, { "epoch": 1.71, "learning_rate": 0.0004305956837424315, "loss": 0.0618, "step": 68180 }, { "epoch": 1.71, "learning_rate": 0.0004302188277265533, "loss": 0.0659, "step": 68190 }, { "epoch": 1.71, "learning_rate": 0.00042984197171067507, "loss": 0.0622, "step": 68200 }, { "epoch": 1.71, "learning_rate": 0.00042946511569479686, "loss": 0.0654, "step": 68210 }, { "epoch": 1.71, "learning_rate": 0.00042908825967891866, "loss": 0.0605, "step": 68220 }, { "epoch": 1.71, "learning_rate": 0.00042871140366304046, "loss": 0.0613, "step": 68230 }, { "epoch": 1.71, "learning_rate": 0.00042833454764716226, "loss": 0.0616, "step": 68240 }, { "epoch": 1.71, "learning_rate": 0.00042795769163128406, "loss": 0.0642, "step": 68250 }, { "epoch": 1.71, "learning_rate": 0.00042758083561540586, "loss": 0.0647, "step": 68260 }, { "epoch": 1.72, "learning_rate": 0.00042720397959952766, "loss": 0.0618, "step": 68270 }, { "epoch": 1.72, "learning_rate": 0.00042682712358364946, "loss": 0.0622, "step": 68280 }, { "epoch": 1.72, "learning_rate": 0.00042645026756777125, "loss": 0.0674, "step": 68290 }, { "epoch": 1.72, "learning_rate": 0.00042607341155189305, "loss": 0.0645, "step": 68300 }, { "epoch": 1.72, "learning_rate": 0.0004256965555360149, "loss": 0.0643, "step": 68310 }, { "epoch": 1.72, "learning_rate": 0.0004253196995201367, "loss": 0.0659, "step": 68320 }, { "epoch": 1.72, "learning_rate": 0.0004249428435042585, "loss": 0.0641, "step": 68330 }, { "epoch": 1.72, "learning_rate": 0.0004245659874883803, "loss": 0.0638, "step": 68340 }, { "epoch": 1.72, "learning_rate": 0.0004241891314725021, "loss": 0.0638, "step": 68350 }, { "epoch": 1.72, "learning_rate": 0.0004238122754566239, "loss": 0.0624, "step": 68360 }, { "epoch": 1.72, "learning_rate": 0.0004234354194407457, "loss": 0.064, "step": 68370 }, { "epoch": 1.72, "learning_rate": 0.0004230585634248675, "loss": 0.0614, "step": 68380 }, { "epoch": 1.72, "learning_rate": 0.0004226817074089893, "loss": 0.0629, "step": 68390 }, { "epoch": 1.72, "learning_rate": 0.0004223048513931111, "loss": 0.065, "step": 68400 }, { "epoch": 1.72, "learning_rate": 0.0004219279953772329, "loss": 0.0652, "step": 68410 }, { "epoch": 1.72, "learning_rate": 0.00042155113936135464, "loss": 0.0619, "step": 68420 }, { "epoch": 1.72, "learning_rate": 0.00042117428334547644, "loss": 0.0639, "step": 68430 }, { "epoch": 1.72, "learning_rate": 0.00042079742732959824, "loss": 0.0622, "step": 68440 }, { "epoch": 1.72, "learning_rate": 0.00042042057131372004, "loss": 0.0649, "step": 68450 }, { "epoch": 1.72, "learning_rate": 0.00042004371529784184, "loss": 0.0617, "step": 68460 }, { "epoch": 1.72, "learning_rate": 0.00041966685928196363, "loss": 0.0616, "step": 68470 }, { "epoch": 1.72, "learning_rate": 0.0004192900032660855, "loss": 0.0656, "step": 68480 }, { "epoch": 1.72, "learning_rate": 0.0004189131472502073, "loss": 0.0644, "step": 68490 }, { "epoch": 1.72, "learning_rate": 0.0004185362912343291, "loss": 0.0654, "step": 68500 }, { "epoch": 1.72, "eval_cer": 0.6652802420781065, "eval_loss": 0.05473272502422333, "eval_runtime": 90.6389, "eval_samples_per_second": 110.317, "eval_steps_per_second": 6.895, "step": 68500 }, { "epoch": 1.72, "learning_rate": 0.0004181594352184509, "loss": 0.0607, "step": 68510 }, { "epoch": 1.72, "learning_rate": 0.0004177825792025727, "loss": 0.0648, "step": 68520 }, { "epoch": 1.72, "learning_rate": 0.0004174057231866945, "loss": 0.0613, "step": 68530 }, { "epoch": 1.72, "learning_rate": 0.0004170288671708163, "loss": 0.0652, "step": 68540 }, { "epoch": 1.72, "learning_rate": 0.0004166520111549381, "loss": 0.0624, "step": 68550 }, { "epoch": 1.72, "learning_rate": 0.0004162751551390599, "loss": 0.0648, "step": 68560 }, { "epoch": 1.72, "learning_rate": 0.0004158982991231817, "loss": 0.0624, "step": 68570 }, { "epoch": 1.72, "learning_rate": 0.0004155214431073035, "loss": 0.0628, "step": 68580 }, { "epoch": 1.72, "learning_rate": 0.00041514458709142533, "loss": 0.0655, "step": 68590 }, { "epoch": 1.72, "learning_rate": 0.00041476773107554713, "loss": 0.0661, "step": 68600 }, { "epoch": 1.72, "learning_rate": 0.0004143908750596689, "loss": 0.0627, "step": 68610 }, { "epoch": 1.72, "learning_rate": 0.0004140140190437907, "loss": 0.063, "step": 68620 }, { "epoch": 1.72, "learning_rate": 0.0004136371630279125, "loss": 0.0662, "step": 68630 }, { "epoch": 1.72, "learning_rate": 0.0004132603070120342, "loss": 0.0645, "step": 68640 }, { "epoch": 1.72, "learning_rate": 0.00041288345099615607, "loss": 0.062, "step": 68650 }, { "epoch": 1.72, "learning_rate": 0.00041250659498027787, "loss": 0.0633, "step": 68660 }, { "epoch": 1.73, "learning_rate": 0.00041212973896439966, "loss": 0.0664, "step": 68670 }, { "epoch": 1.73, "learning_rate": 0.00041175288294852146, "loss": 0.0625, "step": 68680 }, { "epoch": 1.73, "learning_rate": 0.00041137602693264326, "loss": 0.0637, "step": 68690 }, { "epoch": 1.73, "learning_rate": 0.00041099917091676506, "loss": 0.0653, "step": 68700 }, { "epoch": 1.73, "learning_rate": 0.00041062231490088686, "loss": 0.0622, "step": 68710 }, { "epoch": 1.73, "learning_rate": 0.00041024545888500866, "loss": 0.0637, "step": 68720 }, { "epoch": 1.73, "learning_rate": 0.00040986860286913046, "loss": 0.0634, "step": 68730 }, { "epoch": 1.73, "learning_rate": 0.00040949174685325226, "loss": 0.0658, "step": 68740 }, { "epoch": 1.73, "learning_rate": 0.00040911489083737406, "loss": 0.0646, "step": 68750 }, { "epoch": 1.73, "learning_rate": 0.00040873803482149585, "loss": 0.0644, "step": 68760 }, { "epoch": 1.73, "learning_rate": 0.0004083611788056177, "loss": 0.064, "step": 68770 }, { "epoch": 1.73, "learning_rate": 0.0004079843227897395, "loss": 0.0608, "step": 68780 }, { "epoch": 1.73, "learning_rate": 0.0004076074667738613, "loss": 0.0658, "step": 68790 }, { "epoch": 1.73, "learning_rate": 0.0004072306107579831, "loss": 0.0641, "step": 68800 }, { "epoch": 1.73, "learning_rate": 0.0004068537547421049, "loss": 0.0634, "step": 68810 }, { "epoch": 1.73, "learning_rate": 0.0004064768987262267, "loss": 0.0649, "step": 68820 }, { "epoch": 1.73, "learning_rate": 0.0004061000427103485, "loss": 0.0632, "step": 68830 }, { "epoch": 1.73, "learning_rate": 0.0004057231866944703, "loss": 0.0661, "step": 68840 }, { "epoch": 1.73, "learning_rate": 0.0004053463306785921, "loss": 0.065, "step": 68850 }, { "epoch": 1.73, "learning_rate": 0.00040496947466271384, "loss": 0.0658, "step": 68860 }, { "epoch": 1.73, "learning_rate": 0.00040459261864683564, "loss": 0.0654, "step": 68870 }, { "epoch": 1.73, "learning_rate": 0.00040421576263095744, "loss": 0.0607, "step": 68880 }, { "epoch": 1.73, "learning_rate": 0.00040383890661507924, "loss": 0.0647, "step": 68890 }, { "epoch": 1.73, "learning_rate": 0.00040346205059920104, "loss": 0.0608, "step": 68900 }, { "epoch": 1.73, "learning_rate": 0.00040308519458332284, "loss": 0.0642, "step": 68910 }, { "epoch": 1.73, "learning_rate": 0.00040270833856744464, "loss": 0.0664, "step": 68920 }, { "epoch": 1.73, "learning_rate": 0.00040233148255156643, "loss": 0.063, "step": 68930 }, { "epoch": 1.73, "learning_rate": 0.0004019546265356883, "loss": 0.0614, "step": 68940 }, { "epoch": 1.73, "learning_rate": 0.0004015777705198101, "loss": 0.0619, "step": 68950 }, { "epoch": 1.73, "learning_rate": 0.0004012009145039319, "loss": 0.064, "step": 68960 }, { "epoch": 1.73, "learning_rate": 0.0004008240584880537, "loss": 0.061, "step": 68970 }, { "epoch": 1.73, "learning_rate": 0.0004004472024721755, "loss": 0.0616, "step": 68980 }, { "epoch": 1.73, "learning_rate": 0.0004000703464562973, "loss": 0.0635, "step": 68990 }, { "epoch": 1.73, "learning_rate": 0.0003996934904404191, "loss": 0.0648, "step": 69000 }, { "epoch": 1.73, "eval_cer": 0.6652388562694929, "eval_loss": 0.05441926792263985, "eval_runtime": 90.7649, "eval_samples_per_second": 110.164, "eval_steps_per_second": 6.886, "step": 69000 }, { "epoch": 1.73, "learning_rate": 0.0003993166344245409, "loss": 0.0631, "step": 69010 }, { "epoch": 1.73, "learning_rate": 0.0003989397784086627, "loss": 0.061, "step": 69020 }, { "epoch": 1.73, "learning_rate": 0.0003985629223927845, "loss": 0.0661, "step": 69030 }, { "epoch": 1.73, "learning_rate": 0.0003981860663769063, "loss": 0.068, "step": 69040 }, { "epoch": 1.73, "learning_rate": 0.0003978092103610281, "loss": 0.0634, "step": 69050 }, { "epoch": 1.74, "learning_rate": 0.00039743235434514993, "loss": 0.0636, "step": 69060 }, { "epoch": 1.74, "learning_rate": 0.0003970554983292717, "loss": 0.0637, "step": 69070 }, { "epoch": 1.74, "learning_rate": 0.0003966786423133935, "loss": 0.0637, "step": 69080 }, { "epoch": 1.74, "learning_rate": 0.0003963017862975152, "loss": 0.0616, "step": 69090 }, { "epoch": 1.74, "learning_rate": 0.000395924930281637, "loss": 0.0616, "step": 69100 }, { "epoch": 1.74, "learning_rate": 0.0003955480742657588, "loss": 0.0612, "step": 69110 }, { "epoch": 1.74, "learning_rate": 0.00039517121824988067, "loss": 0.0644, "step": 69120 }, { "epoch": 1.74, "learning_rate": 0.00039479436223400247, "loss": 0.0623, "step": 69130 }, { "epoch": 1.74, "learning_rate": 0.00039441750621812426, "loss": 0.0671, "step": 69140 }, { "epoch": 1.74, "learning_rate": 0.00039404065020224606, "loss": 0.0638, "step": 69150 }, { "epoch": 1.74, "learning_rate": 0.00039366379418636786, "loss": 0.0653, "step": 69160 }, { "epoch": 1.74, "learning_rate": 0.00039328693817048966, "loss": 0.0618, "step": 69170 }, { "epoch": 1.74, "learning_rate": 0.00039291008215461146, "loss": 0.0682, "step": 69180 }, { "epoch": 1.74, "learning_rate": 0.00039253322613873326, "loss": 0.066, "step": 69190 }, { "epoch": 1.74, "learning_rate": 0.00039215637012285506, "loss": 0.0612, "step": 69200 }, { "epoch": 1.74, "learning_rate": 0.00039177951410697686, "loss": 0.0609, "step": 69210 }, { "epoch": 1.74, "learning_rate": 0.00039140265809109866, "loss": 0.0658, "step": 69220 }, { "epoch": 1.74, "learning_rate": 0.0003910258020752205, "loss": 0.0637, "step": 69230 }, { "epoch": 1.74, "learning_rate": 0.0003906489460593423, "loss": 0.0654, "step": 69240 }, { "epoch": 1.74, "learning_rate": 0.0003902720900434641, "loss": 0.0591, "step": 69250 }, { "epoch": 1.74, "learning_rate": 0.0003898952340275859, "loss": 0.067, "step": 69260 }, { "epoch": 1.74, "learning_rate": 0.0003895183780117077, "loss": 0.0627, "step": 69270 }, { "epoch": 1.74, "learning_rate": 0.0003891415219958295, "loss": 0.064, "step": 69280 }, { "epoch": 1.74, "learning_rate": 0.0003887646659799513, "loss": 0.0615, "step": 69290 }, { "epoch": 1.74, "learning_rate": 0.0003883878099640731, "loss": 0.0631, "step": 69300 }, { "epoch": 1.74, "learning_rate": 0.00038801095394819484, "loss": 0.0646, "step": 69310 }, { "epoch": 1.74, "learning_rate": 0.00038763409793231664, "loss": 0.0618, "step": 69320 }, { "epoch": 1.74, "learning_rate": 0.00038725724191643844, "loss": 0.0627, "step": 69330 }, { "epoch": 1.74, "learning_rate": 0.00038688038590056024, "loss": 0.0637, "step": 69340 }, { "epoch": 1.74, "learning_rate": 0.00038650352988468204, "loss": 0.066, "step": 69350 }, { "epoch": 1.74, "learning_rate": 0.00038612667386880384, "loss": 0.0635, "step": 69360 }, { "epoch": 1.74, "learning_rate": 0.00038574981785292564, "loss": 0.0645, "step": 69370 }, { "epoch": 1.74, "learning_rate": 0.00038537296183704744, "loss": 0.0632, "step": 69380 }, { "epoch": 1.74, "learning_rate": 0.00038499610582116924, "loss": 0.0679, "step": 69390 }, { "epoch": 1.74, "learning_rate": 0.00038461924980529103, "loss": 0.0631, "step": 69400 }, { "epoch": 1.74, "learning_rate": 0.0003842423937894129, "loss": 0.0632, "step": 69410 }, { "epoch": 1.74, "learning_rate": 0.0003838655377735347, "loss": 0.0607, "step": 69420 }, { "epoch": 1.74, "learning_rate": 0.0003834886817576565, "loss": 0.061, "step": 69430 }, { "epoch": 1.74, "learning_rate": 0.0003831118257417783, "loss": 0.0644, "step": 69440 }, { "epoch": 1.74, "learning_rate": 0.0003827349697259001, "loss": 0.0632, "step": 69450 }, { "epoch": 1.75, "learning_rate": 0.0003823581137100219, "loss": 0.0652, "step": 69460 }, { "epoch": 1.75, "learning_rate": 0.0003819812576941437, "loss": 0.0638, "step": 69470 }, { "epoch": 1.75, "learning_rate": 0.0003816044016782655, "loss": 0.0644, "step": 69480 }, { "epoch": 1.75, "learning_rate": 0.0003812275456623873, "loss": 0.0632, "step": 69490 }, { "epoch": 1.75, "learning_rate": 0.0003808506896465091, "loss": 0.0634, "step": 69500 }, { "epoch": 1.75, "eval_cer": 0.6652205695168496, "eval_loss": 0.05466347932815552, "eval_runtime": 90.7872, "eval_samples_per_second": 110.137, "eval_steps_per_second": 6.884, "step": 69500 }, { "epoch": 1.75, "learning_rate": 0.0003804738336306309, "loss": 0.0635, "step": 69510 }, { "epoch": 1.75, "learning_rate": 0.00038009697761475273, "loss": 0.0631, "step": 69520 }, { "epoch": 1.75, "learning_rate": 0.0003797201215988744, "loss": 0.0653, "step": 69530 }, { "epoch": 1.75, "learning_rate": 0.0003793432655829962, "loss": 0.0644, "step": 69540 }, { "epoch": 1.75, "learning_rate": 0.000378966409567118, "loss": 0.0607, "step": 69550 }, { "epoch": 1.75, "learning_rate": 0.0003785895535512398, "loss": 0.0663, "step": 69560 }, { "epoch": 1.75, "learning_rate": 0.0003782126975353616, "loss": 0.0646, "step": 69570 }, { "epoch": 1.75, "learning_rate": 0.00037783584151948347, "loss": 0.0633, "step": 69580 }, { "epoch": 1.75, "learning_rate": 0.00037745898550360527, "loss": 0.064, "step": 69590 }, { "epoch": 1.75, "learning_rate": 0.00037708212948772707, "loss": 0.0619, "step": 69600 }, { "epoch": 1.75, "learning_rate": 0.00037670527347184886, "loss": 0.06, "step": 69610 }, { "epoch": 1.75, "learning_rate": 0.00037632841745597066, "loss": 0.0627, "step": 69620 }, { "epoch": 1.75, "learning_rate": 0.00037595156144009246, "loss": 0.0618, "step": 69630 }, { "epoch": 1.75, "learning_rate": 0.00037557470542421426, "loss": 0.0643, "step": 69640 }, { "epoch": 1.75, "learning_rate": 0.00037519784940833606, "loss": 0.0647, "step": 69650 }, { "epoch": 1.75, "learning_rate": 0.00037482099339245786, "loss": 0.0622, "step": 69660 }, { "epoch": 1.75, "learning_rate": 0.00037444413737657966, "loss": 0.0646, "step": 69670 }, { "epoch": 1.75, "learning_rate": 0.00037406728136070146, "loss": 0.0632, "step": 69680 }, { "epoch": 1.75, "learning_rate": 0.00037369042534482325, "loss": 0.0615, "step": 69690 }, { "epoch": 1.75, "learning_rate": 0.00037331356932894505, "loss": 0.0654, "step": 69700 }, { "epoch": 1.75, "learning_rate": 0.00037293671331306685, "loss": 0.0621, "step": 69710 }, { "epoch": 1.75, "learning_rate": 0.00037255985729718865, "loss": 0.0611, "step": 69720 }, { "epoch": 1.75, "learning_rate": 0.00037218300128131045, "loss": 0.0651, "step": 69730 }, { "epoch": 1.75, "learning_rate": 0.00037180614526543225, "loss": 0.0624, "step": 69740 }, { "epoch": 1.75, "learning_rate": 0.00037142928924955405, "loss": 0.0651, "step": 69750 }, { "epoch": 1.75, "learning_rate": 0.00037105243323367585, "loss": 0.0625, "step": 69760 }, { "epoch": 1.75, "learning_rate": 0.00037067557721779765, "loss": 0.0627, "step": 69770 }, { "epoch": 1.75, "learning_rate": 0.0003702987212019195, "loss": 0.0657, "step": 69780 }, { "epoch": 1.75, "learning_rate": 0.0003699218651860413, "loss": 0.0654, "step": 69790 }, { "epoch": 1.75, "learning_rate": 0.0003695450091701631, "loss": 0.0615, "step": 69800 }, { "epoch": 1.75, "learning_rate": 0.00036916815315428484, "loss": 0.0639, "step": 69810 }, { "epoch": 1.75, "learning_rate": 0.00036879129713840664, "loss": 0.0629, "step": 69820 }, { "epoch": 1.75, "learning_rate": 0.00036841444112252844, "loss": 0.0632, "step": 69830 }, { "epoch": 1.75, "learning_rate": 0.00036803758510665024, "loss": 0.0595, "step": 69840 }, { "epoch": 1.75, "learning_rate": 0.00036766072909077204, "loss": 0.0634, "step": 69850 }, { "epoch": 1.76, "learning_rate": 0.00036728387307489383, "loss": 0.0647, "step": 69860 }, { "epoch": 1.76, "learning_rate": 0.0003669070170590157, "loss": 0.0643, "step": 69870 }, { "epoch": 1.76, "learning_rate": 0.0003665301610431375, "loss": 0.0602, "step": 69880 }, { "epoch": 1.76, "learning_rate": 0.0003661533050272593, "loss": 0.065, "step": 69890 }, { "epoch": 1.76, "learning_rate": 0.0003657764490113811, "loss": 0.0646, "step": 69900 }, { "epoch": 1.76, "learning_rate": 0.0003653995929955029, "loss": 0.0644, "step": 69910 }, { "epoch": 1.76, "learning_rate": 0.00036502273697962463, "loss": 0.0673, "step": 69920 }, { "epoch": 1.76, "learning_rate": 0.0003646458809637464, "loss": 0.0615, "step": 69930 }, { "epoch": 1.76, "learning_rate": 0.0003642690249478682, "loss": 0.0612, "step": 69940 }, { "epoch": 1.76, "learning_rate": 0.00036389216893199, "loss": 0.0609, "step": 69950 }, { "epoch": 1.76, "learning_rate": 0.0003635153129161119, "loss": 0.0653, "step": 69960 }, { "epoch": 1.76, "learning_rate": 0.0003631384569002337, "loss": 0.0605, "step": 69970 }, { "epoch": 1.76, "learning_rate": 0.0003627616008843555, "loss": 0.064, "step": 69980 }, { "epoch": 1.76, "learning_rate": 0.0003623847448684773, "loss": 0.0625, "step": 69990 }, { "epoch": 1.76, "learning_rate": 0.00036200788885259907, "loss": 0.0642, "step": 70000 }, { "epoch": 1.76, "eval_cer": 0.6653692696896594, "eval_loss": 0.054389722645282745, "eval_runtime": 90.734, "eval_samples_per_second": 110.201, "eval_steps_per_second": 6.888, "step": 70000 }, { "epoch": 1.76, "learning_rate": 0.00036163103283672087, "loss": 0.0622, "step": 70010 }, { "epoch": 1.76, "learning_rate": 0.00036125417682084267, "loss": 0.0612, "step": 70020 }, { "epoch": 1.76, "learning_rate": 0.0003608773208049644, "loss": 0.0615, "step": 70030 }, { "epoch": 1.76, "learning_rate": 0.0003605004647890862, "loss": 0.0621, "step": 70040 }, { "epoch": 1.76, "learning_rate": 0.00036012360877320807, "loss": 0.0629, "step": 70050 }, { "epoch": 1.76, "learning_rate": 0.00035974675275732987, "loss": 0.0632, "step": 70060 }, { "epoch": 1.76, "learning_rate": 0.00035936989674145166, "loss": 0.0636, "step": 70070 }, { "epoch": 1.76, "learning_rate": 0.00035899304072557346, "loss": 0.0664, "step": 70080 }, { "epoch": 1.76, "learning_rate": 0.00035861618470969526, "loss": 0.0626, "step": 70090 }, { "epoch": 1.76, "learning_rate": 0.00035823932869381706, "loss": 0.0607, "step": 70100 }, { "epoch": 1.76, "learning_rate": 0.00035786247267793886, "loss": 0.0632, "step": 70110 }, { "epoch": 1.76, "learning_rate": 0.00035748561666206066, "loss": 0.0652, "step": 70120 }, { "epoch": 1.76, "learning_rate": 0.00035710876064618246, "loss": 0.0649, "step": 70130 }, { "epoch": 1.76, "learning_rate": 0.00035673190463030426, "loss": 0.0622, "step": 70140 }, { "epoch": 1.76, "learning_rate": 0.00035635504861442606, "loss": 0.0669, "step": 70150 }, { "epoch": 1.76, "learning_rate": 0.00035597819259854785, "loss": 0.0627, "step": 70160 }, { "epoch": 1.76, "learning_rate": 0.00035560133658266965, "loss": 0.0651, "step": 70170 }, { "epoch": 1.76, "learning_rate": 0.00035522448056679145, "loss": 0.0624, "step": 70180 }, { "epoch": 1.76, "learning_rate": 0.00035484762455091325, "loss": 0.0621, "step": 70190 }, { "epoch": 1.76, "learning_rate": 0.00035447076853503505, "loss": 0.0648, "step": 70200 }, { "epoch": 1.76, "learning_rate": 0.00035409391251915685, "loss": 0.0621, "step": 70210 }, { "epoch": 1.76, "learning_rate": 0.00035371705650327865, "loss": 0.0623, "step": 70220 }, { "epoch": 1.76, "learning_rate": 0.00035334020048740045, "loss": 0.0631, "step": 70230 }, { "epoch": 1.76, "learning_rate": 0.00035296334447152224, "loss": 0.0619, "step": 70240 }, { "epoch": 1.76, "learning_rate": 0.0003525864884556441, "loss": 0.0611, "step": 70250 }, { "epoch": 1.77, "learning_rate": 0.00035220963243976584, "loss": 0.0656, "step": 70260 }, { "epoch": 1.77, "learning_rate": 0.00035183277642388764, "loss": 0.0644, "step": 70270 }, { "epoch": 1.77, "learning_rate": 0.00035145592040800944, "loss": 0.0662, "step": 70280 }, { "epoch": 1.77, "learning_rate": 0.00035107906439213124, "loss": 0.0625, "step": 70290 }, { "epoch": 1.77, "learning_rate": 0.00035070220837625304, "loss": 0.0634, "step": 70300 }, { "epoch": 1.77, "learning_rate": 0.00035032535236037484, "loss": 0.0604, "step": 70310 }, { "epoch": 1.77, "learning_rate": 0.00034994849634449664, "loss": 0.0602, "step": 70320 }, { "epoch": 1.77, "learning_rate": 0.0003495716403286185, "loss": 0.0634, "step": 70330 }, { "epoch": 1.77, "learning_rate": 0.0003491947843127403, "loss": 0.0613, "step": 70340 }, { "epoch": 1.77, "learning_rate": 0.0003488179282968621, "loss": 0.0648, "step": 70350 }, { "epoch": 1.77, "learning_rate": 0.0003484410722809839, "loss": 0.0603, "step": 70360 }, { "epoch": 1.77, "learning_rate": 0.00034806421626510563, "loss": 0.0621, "step": 70370 }, { "epoch": 1.77, "learning_rate": 0.00034768736024922743, "loss": 0.0659, "step": 70380 }, { "epoch": 1.77, "learning_rate": 0.00034731050423334923, "loss": 0.0619, "step": 70390 }, { "epoch": 1.77, "learning_rate": 0.000346933648217471, "loss": 0.0652, "step": 70400 }, { "epoch": 1.77, "learning_rate": 0.0003465567922015928, "loss": 0.0612, "step": 70410 }, { "epoch": 1.77, "learning_rate": 0.0003461799361857147, "loss": 0.0631, "step": 70420 }, { "epoch": 1.77, "learning_rate": 0.0003458030801698365, "loss": 0.0613, "step": 70430 }, { "epoch": 1.77, "learning_rate": 0.0003454262241539583, "loss": 0.0624, "step": 70440 }, { "epoch": 1.77, "learning_rate": 0.0003450493681380801, "loss": 0.0639, "step": 70450 }, { "epoch": 1.77, "learning_rate": 0.0003446725121222019, "loss": 0.0672, "step": 70460 }, { "epoch": 1.77, "learning_rate": 0.00034429565610632367, "loss": 0.0618, "step": 70470 }, { "epoch": 1.77, "learning_rate": 0.0003439188000904454, "loss": 0.0622, "step": 70480 }, { "epoch": 1.77, "learning_rate": 0.0003435419440745672, "loss": 0.0607, "step": 70490 }, { "epoch": 1.77, "learning_rate": 0.000343165088058689, "loss": 0.0649, "step": 70500 }, { "epoch": 1.77, "eval_cer": 0.66524366857282, "eval_loss": 0.054241545498371124, "eval_runtime": 90.7441, "eval_samples_per_second": 110.189, "eval_steps_per_second": 6.887, "step": 70500 }, { "epoch": 1.77, "learning_rate": 0.00034278823204281087, "loss": 0.0606, "step": 70510 }, { "epoch": 1.77, "learning_rate": 0.00034241137602693267, "loss": 0.0609, "step": 70520 }, { "epoch": 1.77, "learning_rate": 0.00034203452001105447, "loss": 0.0649, "step": 70530 }, { "epoch": 1.77, "learning_rate": 0.00034165766399517626, "loss": 0.0642, "step": 70540 }, { "epoch": 1.77, "learning_rate": 0.00034128080797929806, "loss": 0.0622, "step": 70550 }, { "epoch": 1.77, "learning_rate": 0.00034090395196341986, "loss": 0.065, "step": 70560 }, { "epoch": 1.77, "learning_rate": 0.00034052709594754166, "loss": 0.0619, "step": 70570 }, { "epoch": 1.77, "learning_rate": 0.00034015023993166346, "loss": 0.0651, "step": 70580 }, { "epoch": 1.77, "learning_rate": 0.0003397733839157852, "loss": 0.0682, "step": 70590 }, { "epoch": 1.77, "learning_rate": 0.00033939652789990706, "loss": 0.0646, "step": 70600 }, { "epoch": 1.77, "learning_rate": 0.00033901967188402886, "loss": 0.0616, "step": 70610 }, { "epoch": 1.77, "learning_rate": 0.00033864281586815065, "loss": 0.0637, "step": 70620 }, { "epoch": 1.77, "learning_rate": 0.00033826595985227245, "loss": 0.0624, "step": 70630 }, { "epoch": 1.77, "learning_rate": 0.00033788910383639425, "loss": 0.0632, "step": 70640 }, { "epoch": 1.77, "learning_rate": 0.00033751224782051605, "loss": 0.0624, "step": 70650 }, { "epoch": 1.78, "learning_rate": 0.00033713539180463785, "loss": 0.0621, "step": 70660 }, { "epoch": 1.78, "learning_rate": 0.00033675853578875965, "loss": 0.0638, "step": 70670 }, { "epoch": 1.78, "learning_rate": 0.00033638167977288145, "loss": 0.0678, "step": 70680 }, { "epoch": 1.78, "learning_rate": 0.00033600482375700325, "loss": 0.0651, "step": 70690 }, { "epoch": 1.78, "learning_rate": 0.00033562796774112505, "loss": 0.0675, "step": 70700 }, { "epoch": 1.78, "learning_rate": 0.00033525111172524684, "loss": 0.0615, "step": 70710 }, { "epoch": 1.78, "learning_rate": 0.00033487425570936864, "loss": 0.0636, "step": 70720 }, { "epoch": 1.78, "learning_rate": 0.00033449739969349044, "loss": 0.0627, "step": 70730 }, { "epoch": 1.78, "learning_rate": 0.00033412054367761224, "loss": 0.0677, "step": 70740 }, { "epoch": 1.78, "learning_rate": 0.00033374368766173404, "loss": 0.0682, "step": 70750 }, { "epoch": 1.78, "learning_rate": 0.00033336683164585584, "loss": 0.0618, "step": 70760 }, { "epoch": 1.78, "learning_rate": 0.00033298997562997764, "loss": 0.064, "step": 70770 }, { "epoch": 1.78, "learning_rate": 0.00033261311961409944, "loss": 0.0645, "step": 70780 }, { "epoch": 1.78, "learning_rate": 0.00033223626359822124, "loss": 0.0644, "step": 70790 }, { "epoch": 1.78, "learning_rate": 0.0003318594075823431, "loss": 0.0653, "step": 70800 }, { "epoch": 1.78, "learning_rate": 0.00033148255156646483, "loss": 0.0629, "step": 70810 }, { "epoch": 1.78, "learning_rate": 0.00033110569555058663, "loss": 0.0617, "step": 70820 }, { "epoch": 1.78, "learning_rate": 0.00033072883953470843, "loss": 0.062, "step": 70830 }, { "epoch": 1.78, "learning_rate": 0.00033035198351883023, "loss": 0.0629, "step": 70840 }, { "epoch": 1.78, "learning_rate": 0.00032997512750295203, "loss": 0.0628, "step": 70850 }, { "epoch": 1.78, "learning_rate": 0.0003295982714870738, "loss": 0.0653, "step": 70860 }, { "epoch": 1.78, "learning_rate": 0.0003292214154711956, "loss": 0.0627, "step": 70870 }, { "epoch": 1.78, "learning_rate": 0.0003288445594553175, "loss": 0.0641, "step": 70880 }, { "epoch": 1.78, "learning_rate": 0.0003284677034394393, "loss": 0.0656, "step": 70890 }, { "epoch": 1.78, "learning_rate": 0.0003280908474235611, "loss": 0.0652, "step": 70900 }, { "epoch": 1.78, "learning_rate": 0.0003277139914076829, "loss": 0.0614, "step": 70910 }, { "epoch": 1.78, "learning_rate": 0.0003273371353918046, "loss": 0.0635, "step": 70920 }, { "epoch": 1.78, "learning_rate": 0.0003269602793759264, "loss": 0.0615, "step": 70930 }, { "epoch": 1.78, "learning_rate": 0.0003265834233600482, "loss": 0.0628, "step": 70940 }, { "epoch": 1.78, "learning_rate": 0.00032620656734417, "loss": 0.0638, "step": 70950 }, { "epoch": 1.78, "learning_rate": 0.0003258297113282918, "loss": 0.0637, "step": 70960 }, { "epoch": 1.78, "learning_rate": 0.00032545285531241367, "loss": 0.0605, "step": 70970 }, { "epoch": 1.78, "learning_rate": 0.00032507599929653547, "loss": 0.0628, "step": 70980 }, { "epoch": 1.78, "learning_rate": 0.00032469914328065727, "loss": 0.0627, "step": 70990 }, { "epoch": 1.78, "learning_rate": 0.00032432228726477906, "loss": 0.0641, "step": 71000 }, { "epoch": 1.78, "eval_cer": 0.6652013203035408, "eval_loss": 0.053951624780893326, "eval_runtime": 90.7661, "eval_samples_per_second": 110.162, "eval_steps_per_second": 6.886, "step": 71000 }, { "epoch": 1.78, "learning_rate": 0.00032394543124890086, "loss": 0.0643, "step": 71010 }, { "epoch": 1.78, "learning_rate": 0.00032356857523302266, "loss": 0.0586, "step": 71020 }, { "epoch": 1.78, "learning_rate": 0.0003231917192171444, "loss": 0.0624, "step": 71030 }, { "epoch": 1.78, "learning_rate": 0.0003228148632012662, "loss": 0.0617, "step": 71040 }, { "epoch": 1.79, "learning_rate": 0.000322438007185388, "loss": 0.0641, "step": 71050 }, { "epoch": 1.79, "learning_rate": 0.00032206115116950986, "loss": 0.062, "step": 71060 }, { "epoch": 1.79, "learning_rate": 0.00032168429515363166, "loss": 0.0642, "step": 71070 }, { "epoch": 1.79, "learning_rate": 0.00032130743913775346, "loss": 0.0607, "step": 71080 }, { "epoch": 1.79, "learning_rate": 0.00032093058312187525, "loss": 0.0608, "step": 71090 }, { "epoch": 1.79, "learning_rate": 0.00032055372710599705, "loss": 0.0588, "step": 71100 }, { "epoch": 1.79, "learning_rate": 0.00032017687109011885, "loss": 0.0639, "step": 71110 }, { "epoch": 1.79, "learning_rate": 0.00031980001507424065, "loss": 0.0629, "step": 71120 }, { "epoch": 1.79, "learning_rate": 0.00031942315905836245, "loss": 0.0616, "step": 71130 }, { "epoch": 1.79, "learning_rate": 0.00031904630304248425, "loss": 0.0612, "step": 71140 }, { "epoch": 1.79, "learning_rate": 0.00031866944702660605, "loss": 0.0648, "step": 71150 }, { "epoch": 1.79, "learning_rate": 0.00031829259101072785, "loss": 0.0631, "step": 71160 }, { "epoch": 1.79, "learning_rate": 0.00031791573499484965, "loss": 0.0609, "step": 71170 }, { "epoch": 1.79, "learning_rate": 0.00031753887897897144, "loss": 0.0603, "step": 71180 }, { "epoch": 1.79, "learning_rate": 0.00031716202296309324, "loss": 0.0636, "step": 71190 }, { "epoch": 1.79, "learning_rate": 0.00031678516694721504, "loss": 0.0587, "step": 71200 }, { "epoch": 1.79, "learning_rate": 0.00031640831093133684, "loss": 0.0612, "step": 71210 }, { "epoch": 1.79, "learning_rate": 0.00031603145491545864, "loss": 0.0611, "step": 71220 }, { "epoch": 1.79, "learning_rate": 0.00031565459889958044, "loss": 0.063, "step": 71230 }, { "epoch": 1.79, "learning_rate": 0.00031527774288370224, "loss": 0.0617, "step": 71240 }, { "epoch": 1.79, "learning_rate": 0.00031490088686782404, "loss": 0.0621, "step": 71250 }, { "epoch": 1.79, "learning_rate": 0.00031452403085194583, "loss": 0.0598, "step": 71260 }, { "epoch": 1.79, "learning_rate": 0.00031414717483606763, "loss": 0.0627, "step": 71270 }, { "epoch": 1.79, "learning_rate": 0.00031377031882018943, "loss": 0.0653, "step": 71280 }, { "epoch": 1.79, "learning_rate": 0.00031339346280431123, "loss": 0.059, "step": 71290 }, { "epoch": 1.79, "learning_rate": 0.00031301660678843303, "loss": 0.0609, "step": 71300 }, { "epoch": 1.79, "learning_rate": 0.00031263975077255483, "loss": 0.0641, "step": 71310 }, { "epoch": 1.79, "learning_rate": 0.00031226289475667663, "loss": 0.0651, "step": 71320 }, { "epoch": 1.79, "learning_rate": 0.0003118860387407984, "loss": 0.063, "step": 71330 }, { "epoch": 1.79, "learning_rate": 0.0003115091827249202, "loss": 0.0604, "step": 71340 }, { "epoch": 1.79, "learning_rate": 0.0003111323267090421, "loss": 0.0629, "step": 71350 }, { "epoch": 1.79, "learning_rate": 0.0003107554706931639, "loss": 0.0601, "step": 71360 }, { "epoch": 1.79, "learning_rate": 0.0003103786146772856, "loss": 0.0604, "step": 71370 }, { "epoch": 1.79, "learning_rate": 0.0003100017586614074, "loss": 0.0625, "step": 71380 }, { "epoch": 1.79, "learning_rate": 0.0003096249026455292, "loss": 0.0602, "step": 71390 }, { "epoch": 1.79, "learning_rate": 0.000309248046629651, "loss": 0.064, "step": 71400 }, { "epoch": 1.79, "learning_rate": 0.0003088711906137728, "loss": 0.0646, "step": 71410 }, { "epoch": 1.79, "learning_rate": 0.0003084943345978946, "loss": 0.0625, "step": 71420 }, { "epoch": 1.79, "learning_rate": 0.0003081174785820164, "loss": 0.0599, "step": 71430 }, { "epoch": 1.79, "learning_rate": 0.00030774062256613827, "loss": 0.0649, "step": 71440 }, { "epoch": 1.8, "learning_rate": 0.00030736376655026007, "loss": 0.0652, "step": 71450 }, { "epoch": 1.8, "learning_rate": 0.00030698691053438187, "loss": 0.063, "step": 71460 }, { "epoch": 1.8, "learning_rate": 0.00030661005451850366, "loss": 0.0613, "step": 71470 }, { "epoch": 1.8, "learning_rate": 0.0003062331985026254, "loss": 0.0652, "step": 71480 }, { "epoch": 1.8, "learning_rate": 0.0003058563424867472, "loss": 0.062, "step": 71490 }, { "epoch": 1.8, "learning_rate": 0.000305479486470869, "loss": 0.0659, "step": 71500 }, { "epoch": 1.8, "eval_cer": 0.6653043035947425, "eval_loss": 0.05395006760954857, "eval_runtime": 90.8279, "eval_samples_per_second": 110.087, "eval_steps_per_second": 6.881, "step": 71500 }, { "epoch": 1.8, "learning_rate": 0.0003051026304549908, "loss": 0.0621, "step": 71510 }, { "epoch": 1.8, "learning_rate": 0.00030472577443911266, "loss": 0.059, "step": 71520 }, { "epoch": 1.8, "learning_rate": 0.00030434891842323446, "loss": 0.0615, "step": 71530 }, { "epoch": 1.8, "learning_rate": 0.00030397206240735626, "loss": 0.0614, "step": 71540 }, { "epoch": 1.8, "learning_rate": 0.00030359520639147806, "loss": 0.0612, "step": 71550 }, { "epoch": 1.8, "learning_rate": 0.00030321835037559985, "loss": 0.0659, "step": 71560 }, { "epoch": 1.8, "learning_rate": 0.00030284149435972165, "loss": 0.0637, "step": 71570 }, { "epoch": 1.8, "learning_rate": 0.00030246463834384345, "loss": 0.063, "step": 71580 }, { "epoch": 1.8, "learning_rate": 0.0003020877823279652, "loss": 0.0588, "step": 71590 }, { "epoch": 1.8, "learning_rate": 0.000301710926312087, "loss": 0.0634, "step": 71600 }, { "epoch": 1.8, "learning_rate": 0.00030133407029620885, "loss": 0.0591, "step": 71610 }, { "epoch": 1.8, "learning_rate": 0.00030095721428033065, "loss": 0.0631, "step": 71620 }, { "epoch": 1.8, "learning_rate": 0.00030058035826445245, "loss": 0.0608, "step": 71630 }, { "epoch": 1.8, "learning_rate": 0.00030020350224857424, "loss": 0.0653, "step": 71640 }, { "epoch": 1.8, "learning_rate": 0.00029982664623269604, "loss": 0.065, "step": 71650 }, { "epoch": 1.8, "learning_rate": 0.00029944979021681784, "loss": 0.0664, "step": 71660 }, { "epoch": 1.8, "learning_rate": 0.00029907293420093964, "loss": 0.064, "step": 71670 }, { "epoch": 1.8, "learning_rate": 0.00029869607818506144, "loss": 0.0653, "step": 71680 }, { "epoch": 1.8, "learning_rate": 0.00029831922216918324, "loss": 0.0609, "step": 71690 }, { "epoch": 1.8, "learning_rate": 0.00029794236615330504, "loss": 0.06, "step": 71700 }, { "epoch": 1.8, "learning_rate": 0.00029756551013742684, "loss": 0.0614, "step": 71710 }, { "epoch": 1.8, "learning_rate": 0.00029718865412154864, "loss": 0.0588, "step": 71720 }, { "epoch": 1.8, "learning_rate": 0.00029681179810567043, "loss": 0.0643, "step": 71730 }, { "epoch": 1.8, "learning_rate": 0.00029643494208979223, "loss": 0.0627, "step": 71740 }, { "epoch": 1.8, "learning_rate": 0.00029605808607391403, "loss": 0.0608, "step": 71750 }, { "epoch": 1.8, "learning_rate": 0.00029568123005803583, "loss": 0.0638, "step": 71760 }, { "epoch": 1.8, "learning_rate": 0.00029530437404215763, "loss": 0.063, "step": 71770 }, { "epoch": 1.8, "learning_rate": 0.00029492751802627943, "loss": 0.064, "step": 71780 }, { "epoch": 1.8, "learning_rate": 0.00029455066201040123, "loss": 0.0607, "step": 71790 }, { "epoch": 1.8, "learning_rate": 0.000294173805994523, "loss": 0.0645, "step": 71800 }, { "epoch": 1.8, "learning_rate": 0.0002937969499786448, "loss": 0.0607, "step": 71810 }, { "epoch": 1.8, "learning_rate": 0.0002934200939627666, "loss": 0.0641, "step": 71820 }, { "epoch": 1.8, "learning_rate": 0.0002930432379468884, "loss": 0.0632, "step": 71830 }, { "epoch": 1.8, "learning_rate": 0.0002926663819310102, "loss": 0.065, "step": 71840 }, { "epoch": 1.81, "learning_rate": 0.000292289525915132, "loss": 0.0644, "step": 71850 }, { "epoch": 1.81, "learning_rate": 0.0002919126698992538, "loss": 0.0651, "step": 71860 }, { "epoch": 1.81, "learning_rate": 0.0002915358138833756, "loss": 0.0606, "step": 71870 }, { "epoch": 1.81, "learning_rate": 0.0002911589578674974, "loss": 0.0585, "step": 71880 }, { "epoch": 1.81, "learning_rate": 0.0002907821018516192, "loss": 0.0641, "step": 71890 }, { "epoch": 1.81, "learning_rate": 0.00029040524583574107, "loss": 0.0615, "step": 71900 }, { "epoch": 1.81, "learning_rate": 0.00029002838981986287, "loss": 0.0648, "step": 71910 }, { "epoch": 1.81, "learning_rate": 0.0002896515338039846, "loss": 0.0629, "step": 71920 }, { "epoch": 1.81, "learning_rate": 0.0002892746777881064, "loss": 0.0605, "step": 71930 }, { "epoch": 1.81, "learning_rate": 0.0002888978217722282, "loss": 0.0626, "step": 71940 }, { "epoch": 1.81, "learning_rate": 0.00028852096575635, "loss": 0.0632, "step": 71950 }, { "epoch": 1.81, "learning_rate": 0.0002881441097404718, "loss": 0.0635, "step": 71960 }, { "epoch": 1.81, "learning_rate": 0.0002877672537245936, "loss": 0.0633, "step": 71970 }, { "epoch": 1.81, "learning_rate": 0.0002873903977087154, "loss": 0.0655, "step": 71980 }, { "epoch": 1.81, "learning_rate": 0.00028701354169283726, "loss": 0.0627, "step": 71990 }, { "epoch": 1.81, "learning_rate": 0.00028663668567695906, "loss": 0.0651, "step": 72000 }, { "epoch": 1.81, "eval_cer": 0.6652186445955187, "eval_loss": 0.053641460835933685, "eval_runtime": 90.6025, "eval_samples_per_second": 110.361, "eval_steps_per_second": 6.898, "step": 72000 }, { "epoch": 1.81, "learning_rate": 0.00028625982966108086, "loss": 0.0627, "step": 72010 }, { "epoch": 1.81, "learning_rate": 0.00028588297364520265, "loss": 0.0629, "step": 72020 }, { "epoch": 1.81, "learning_rate": 0.00028550611762932445, "loss": 0.0617, "step": 72030 }, { "epoch": 1.81, "learning_rate": 0.0002851292616134462, "loss": 0.0637, "step": 72040 }, { "epoch": 1.81, "learning_rate": 0.000284752405597568, "loss": 0.0618, "step": 72050 }, { "epoch": 1.81, "learning_rate": 0.0002843755495816898, "loss": 0.0641, "step": 72060 }, { "epoch": 1.81, "learning_rate": 0.00028399869356581165, "loss": 0.0624, "step": 72070 }, { "epoch": 1.81, "learning_rate": 0.00028362183754993345, "loss": 0.0617, "step": 72080 }, { "epoch": 1.81, "learning_rate": 0.00028324498153405525, "loss": 0.0627, "step": 72090 }, { "epoch": 1.81, "learning_rate": 0.00028286812551817705, "loss": 0.0636, "step": 72100 }, { "epoch": 1.81, "learning_rate": 0.00028249126950229884, "loss": 0.0631, "step": 72110 }, { "epoch": 1.81, "learning_rate": 0.00028211441348642064, "loss": 0.0613, "step": 72120 }, { "epoch": 1.81, "learning_rate": 0.00028173755747054244, "loss": 0.0608, "step": 72130 }, { "epoch": 1.81, "learning_rate": 0.00028136070145466424, "loss": 0.063, "step": 72140 }, { "epoch": 1.81, "learning_rate": 0.000280983845438786, "loss": 0.0623, "step": 72150 }, { "epoch": 1.81, "learning_rate": 0.00028060698942290784, "loss": 0.0613, "step": 72160 }, { "epoch": 1.81, "learning_rate": 0.00028023013340702964, "loss": 0.0598, "step": 72170 }, { "epoch": 1.81, "learning_rate": 0.00027985327739115144, "loss": 0.0657, "step": 72180 }, { "epoch": 1.81, "learning_rate": 0.00027947642137527323, "loss": 0.061, "step": 72190 }, { "epoch": 1.81, "learning_rate": 0.00027909956535939503, "loss": 0.0615, "step": 72200 }, { "epoch": 1.81, "learning_rate": 0.00027872270934351683, "loss": 0.0625, "step": 72210 }, { "epoch": 1.81, "learning_rate": 0.00027834585332763863, "loss": 0.0626, "step": 72220 }, { "epoch": 1.81, "learning_rate": 0.00027796899731176043, "loss": 0.0669, "step": 72230 }, { "epoch": 1.81, "learning_rate": 0.00027759214129588223, "loss": 0.0622, "step": 72240 }, { "epoch": 1.82, "learning_rate": 0.00027721528528000403, "loss": 0.0625, "step": 72250 }, { "epoch": 1.82, "learning_rate": 0.0002768384292641258, "loss": 0.0602, "step": 72260 }, { "epoch": 1.82, "learning_rate": 0.0002764615732482476, "loss": 0.0642, "step": 72270 }, { "epoch": 1.82, "learning_rate": 0.0002760847172323694, "loss": 0.0632, "step": 72280 }, { "epoch": 1.82, "learning_rate": 0.0002757078612164912, "loss": 0.0598, "step": 72290 }, { "epoch": 1.82, "learning_rate": 0.000275331005200613, "loss": 0.0613, "step": 72300 }, { "epoch": 1.82, "learning_rate": 0.0002749541491847348, "loss": 0.0633, "step": 72310 }, { "epoch": 1.82, "learning_rate": 0.0002745772931688566, "loss": 0.0616, "step": 72320 }, { "epoch": 1.82, "learning_rate": 0.0002742004371529784, "loss": 0.061, "step": 72330 }, { "epoch": 1.82, "learning_rate": 0.0002738235811371002, "loss": 0.0608, "step": 72340 }, { "epoch": 1.82, "learning_rate": 0.000273446725121222, "loss": 0.0611, "step": 72350 }, { "epoch": 1.82, "learning_rate": 0.00027306986910534387, "loss": 0.0646, "step": 72360 }, { "epoch": 1.82, "learning_rate": 0.0002726930130894656, "loss": 0.0621, "step": 72370 }, { "epoch": 1.82, "learning_rate": 0.0002723161570735874, "loss": 0.0633, "step": 72380 }, { "epoch": 1.82, "learning_rate": 0.0002719393010577092, "loss": 0.0626, "step": 72390 }, { "epoch": 1.82, "learning_rate": 0.000271562445041831, "loss": 0.0641, "step": 72400 }, { "epoch": 1.82, "learning_rate": 0.0002711855890259528, "loss": 0.0633, "step": 72410 }, { "epoch": 1.82, "learning_rate": 0.0002708087330100746, "loss": 0.062, "step": 72420 }, { "epoch": 1.82, "learning_rate": 0.0002704318769941964, "loss": 0.0646, "step": 72430 }, { "epoch": 1.82, "learning_rate": 0.0002700550209783182, "loss": 0.0604, "step": 72440 }, { "epoch": 1.82, "learning_rate": 0.00026967816496244006, "loss": 0.0631, "step": 72450 }, { "epoch": 1.82, "learning_rate": 0.00026930130894656186, "loss": 0.0602, "step": 72460 }, { "epoch": 1.82, "learning_rate": 0.00026892445293068366, "loss": 0.062, "step": 72470 }, { "epoch": 1.82, "learning_rate": 0.0002685475969148054, "loss": 0.0606, "step": 72480 }, { "epoch": 1.82, "learning_rate": 0.0002681707408989272, "loss": 0.0629, "step": 72490 }, { "epoch": 1.82, "learning_rate": 0.000267793884883049, "loss": 0.0625, "step": 72500 }, { "epoch": 1.82, "eval_cer": 0.6651657092589197, "eval_loss": 0.05356631428003311, "eval_runtime": 90.9229, "eval_samples_per_second": 109.972, "eval_steps_per_second": 6.874, "step": 72500 }, { "epoch": 1.82, "learning_rate": 0.0002674170288671708, "loss": 0.064, "step": 72510 }, { "epoch": 1.82, "learning_rate": 0.0002670401728512926, "loss": 0.0625, "step": 72520 }, { "epoch": 1.82, "learning_rate": 0.0002666633168354144, "loss": 0.0609, "step": 72530 }, { "epoch": 1.82, "learning_rate": 0.00026628646081953625, "loss": 0.0611, "step": 72540 }, { "epoch": 1.82, "learning_rate": 0.00026590960480365805, "loss": 0.0642, "step": 72550 }, { "epoch": 1.82, "learning_rate": 0.00026553274878777985, "loss": 0.0605, "step": 72560 }, { "epoch": 1.82, "learning_rate": 0.00026515589277190164, "loss": 0.0596, "step": 72570 }, { "epoch": 1.82, "learning_rate": 0.00026477903675602344, "loss": 0.0594, "step": 72580 }, { "epoch": 1.82, "learning_rate": 0.0002644021807401452, "loss": 0.0612, "step": 72590 }, { "epoch": 1.82, "learning_rate": 0.000264025324724267, "loss": 0.06, "step": 72600 }, { "epoch": 1.82, "learning_rate": 0.0002636484687083888, "loss": 0.0629, "step": 72610 }, { "epoch": 1.82, "learning_rate": 0.00026327161269251064, "loss": 0.062, "step": 72620 }, { "epoch": 1.82, "learning_rate": 0.00026289475667663244, "loss": 0.0625, "step": 72630 }, { "epoch": 1.82, "learning_rate": 0.00026251790066075424, "loss": 0.061, "step": 72640 }, { "epoch": 1.83, "learning_rate": 0.00026214104464487604, "loss": 0.0599, "step": 72650 }, { "epoch": 1.83, "learning_rate": 0.00026176418862899783, "loss": 0.0616, "step": 72660 }, { "epoch": 1.83, "learning_rate": 0.00026138733261311963, "loss": 0.0633, "step": 72670 }, { "epoch": 1.83, "learning_rate": 0.00026101047659724143, "loss": 0.0604, "step": 72680 }, { "epoch": 1.83, "learning_rate": 0.00026063362058136323, "loss": 0.0581, "step": 72690 }, { "epoch": 1.83, "learning_rate": 0.000260256764565485, "loss": 0.0636, "step": 72700 }, { "epoch": 1.83, "learning_rate": 0.00025987990854960683, "loss": 0.0613, "step": 72710 }, { "epoch": 1.83, "learning_rate": 0.00025950305253372863, "loss": 0.065, "step": 72720 }, { "epoch": 1.83, "learning_rate": 0.0002591261965178504, "loss": 0.0623, "step": 72730 }, { "epoch": 1.83, "learning_rate": 0.0002587493405019722, "loss": 0.0636, "step": 72740 }, { "epoch": 1.83, "learning_rate": 0.000258372484486094, "loss": 0.0666, "step": 72750 }, { "epoch": 1.83, "learning_rate": 0.0002579956284702158, "loss": 0.0629, "step": 72760 }, { "epoch": 1.83, "learning_rate": 0.0002576187724543376, "loss": 0.0617, "step": 72770 }, { "epoch": 1.83, "learning_rate": 0.0002572419164384594, "loss": 0.0617, "step": 72780 }, { "epoch": 1.83, "learning_rate": 0.0002568650604225812, "loss": 0.0678, "step": 72790 }, { "epoch": 1.83, "learning_rate": 0.000256488204406703, "loss": 0.0653, "step": 72800 }, { "epoch": 1.83, "learning_rate": 0.0002561113483908248, "loss": 0.063, "step": 72810 }, { "epoch": 1.83, "learning_rate": 0.0002557344923749466, "loss": 0.0597, "step": 72820 }, { "epoch": 1.83, "learning_rate": 0.0002553576363590684, "loss": 0.0646, "step": 72830 }, { "epoch": 1.83, "learning_rate": 0.0002549807803431902, "loss": 0.0633, "step": 72840 }, { "epoch": 1.83, "learning_rate": 0.000254603924327312, "loss": 0.0611, "step": 72850 }, { "epoch": 1.83, "learning_rate": 0.0002542270683114338, "loss": 0.058, "step": 72860 }, { "epoch": 1.83, "learning_rate": 0.0002538502122955556, "loss": 0.0618, "step": 72870 }, { "epoch": 1.83, "learning_rate": 0.0002534733562796774, "loss": 0.0654, "step": 72880 }, { "epoch": 1.83, "learning_rate": 0.0002530965002637992, "loss": 0.0609, "step": 72890 }, { "epoch": 1.83, "learning_rate": 0.000252719644247921, "loss": 0.0614, "step": 72900 }, { "epoch": 1.83, "learning_rate": 0.00025234278823204286, "loss": 0.0612, "step": 72910 }, { "epoch": 1.83, "learning_rate": 0.00025196593221616466, "loss": 0.0605, "step": 72920 }, { "epoch": 1.83, "learning_rate": 0.0002515890762002864, "loss": 0.0595, "step": 72930 }, { "epoch": 1.83, "learning_rate": 0.0002512122201844082, "loss": 0.0611, "step": 72940 }, { "epoch": 1.83, "learning_rate": 0.00025083536416853, "loss": 0.0629, "step": 72950 }, { "epoch": 1.83, "learning_rate": 0.0002504585081526518, "loss": 0.063, "step": 72960 }, { "epoch": 1.83, "learning_rate": 0.0002500816521367736, "loss": 0.0602, "step": 72970 }, { "epoch": 1.83, "learning_rate": 0.0002497047961208954, "loss": 0.0601, "step": 72980 }, { "epoch": 1.83, "learning_rate": 0.0002493279401050172, "loss": 0.0614, "step": 72990 }, { "epoch": 1.83, "learning_rate": 0.00024895108408913905, "loss": 0.0631, "step": 73000 }, { "epoch": 1.83, "eval_cer": 0.6650651321193817, "eval_loss": 0.053635094314813614, "eval_runtime": 90.7023, "eval_samples_per_second": 110.24, "eval_steps_per_second": 6.891, "step": 73000 }, { "epoch": 1.83, "learning_rate": 0.00024857422807326085, "loss": 0.0621, "step": 73010 }, { "epoch": 1.83, "learning_rate": 0.00024819737205738265, "loss": 0.0643, "step": 73020 }, { "epoch": 1.83, "learning_rate": 0.00024782051604150445, "loss": 0.0621, "step": 73030 }, { "epoch": 1.84, "learning_rate": 0.0002474436600256262, "loss": 0.0642, "step": 73040 }, { "epoch": 1.84, "learning_rate": 0.000247066804009748, "loss": 0.0633, "step": 73050 }, { "epoch": 1.84, "learning_rate": 0.0002466899479938698, "loss": 0.0609, "step": 73060 }, { "epoch": 1.84, "learning_rate": 0.0002463130919779916, "loss": 0.0606, "step": 73070 }, { "epoch": 1.84, "learning_rate": 0.0002459362359621134, "loss": 0.0594, "step": 73080 }, { "epoch": 1.84, "learning_rate": 0.00024555937994623524, "loss": 0.059, "step": 73090 }, { "epoch": 1.84, "learning_rate": 0.00024518252393035704, "loss": 0.0631, "step": 73100 }, { "epoch": 1.84, "learning_rate": 0.00024480566791447884, "loss": 0.0625, "step": 73110 }, { "epoch": 1.84, "learning_rate": 0.00024442881189860064, "loss": 0.064, "step": 73120 }, { "epoch": 1.84, "learning_rate": 0.00024405195588272243, "loss": 0.0611, "step": 73130 }, { "epoch": 1.84, "learning_rate": 0.00024367509986684423, "loss": 0.0629, "step": 73140 }, { "epoch": 1.84, "learning_rate": 0.000243298243850966, "loss": 0.0627, "step": 73150 }, { "epoch": 1.84, "learning_rate": 0.0002429213878350878, "loss": 0.0621, "step": 73160 }, { "epoch": 1.84, "learning_rate": 0.0002425445318192096, "loss": 0.0617, "step": 73170 }, { "epoch": 1.84, "learning_rate": 0.0002421676758033314, "loss": 0.0608, "step": 73180 }, { "epoch": 1.84, "learning_rate": 0.0002417908197874532, "loss": 0.0624, "step": 73190 }, { "epoch": 1.84, "learning_rate": 0.00024141396377157503, "loss": 0.0643, "step": 73200 }, { "epoch": 1.84, "learning_rate": 0.00024103710775569682, "loss": 0.0623, "step": 73210 }, { "epoch": 1.84, "learning_rate": 0.00024066025173981862, "loss": 0.0618, "step": 73220 }, { "epoch": 1.84, "learning_rate": 0.00024028339572394042, "loss": 0.0609, "step": 73230 }, { "epoch": 1.84, "learning_rate": 0.00023990653970806222, "loss": 0.0597, "step": 73240 }, { "epoch": 1.84, "learning_rate": 0.00023952968369218402, "loss": 0.065, "step": 73250 }, { "epoch": 1.84, "learning_rate": 0.0002391528276763058, "loss": 0.0639, "step": 73260 }, { "epoch": 1.84, "learning_rate": 0.0002387759716604276, "loss": 0.0597, "step": 73270 }, { "epoch": 1.84, "learning_rate": 0.0002383991156445494, "loss": 0.0617, "step": 73280 }, { "epoch": 1.84, "learning_rate": 0.00023802225962867122, "loss": 0.0646, "step": 73290 }, { "epoch": 1.84, "learning_rate": 0.00023764540361279301, "loss": 0.0568, "step": 73300 }, { "epoch": 1.84, "learning_rate": 0.0002372685475969148, "loss": 0.06, "step": 73310 }, { "epoch": 1.84, "learning_rate": 0.0002368916915810366, "loss": 0.0624, "step": 73320 }, { "epoch": 1.84, "learning_rate": 0.0002365148355651584, "loss": 0.0653, "step": 73330 }, { "epoch": 1.84, "learning_rate": 0.0002361379795492802, "loss": 0.0644, "step": 73340 }, { "epoch": 1.84, "learning_rate": 0.00023576112353340204, "loss": 0.0611, "step": 73350 }, { "epoch": 1.84, "learning_rate": 0.00023538426751752383, "loss": 0.0641, "step": 73360 }, { "epoch": 1.84, "learning_rate": 0.00023500741150164558, "loss": 0.0611, "step": 73370 }, { "epoch": 1.84, "learning_rate": 0.0002346305554857674, "loss": 0.0613, "step": 73380 }, { "epoch": 1.84, "learning_rate": 0.0002342536994698892, "loss": 0.0643, "step": 73390 }, { "epoch": 1.84, "learning_rate": 0.000233876843454011, "loss": 0.0631, "step": 73400 }, { "epoch": 1.84, "learning_rate": 0.0002334999874381328, "loss": 0.0676, "step": 73410 }, { "epoch": 1.84, "learning_rate": 0.0002331231314222546, "loss": 0.0632, "step": 73420 }, { "epoch": 1.84, "learning_rate": 0.0002327462754063764, "loss": 0.0612, "step": 73430 }, { "epoch": 1.85, "learning_rate": 0.00023236941939049822, "loss": 0.0634, "step": 73440 }, { "epoch": 1.85, "learning_rate": 0.00023199256337462002, "loss": 0.0617, "step": 73450 }, { "epoch": 1.85, "learning_rate": 0.00023161570735874182, "loss": 0.0628, "step": 73460 }, { "epoch": 1.85, "learning_rate": 0.00023123885134286362, "loss": 0.0638, "step": 73470 }, { "epoch": 1.85, "learning_rate": 0.0002308619953269854, "loss": 0.0617, "step": 73480 }, { "epoch": 1.85, "learning_rate": 0.0002304851393111072, "loss": 0.0626, "step": 73490 }, { "epoch": 1.85, "learning_rate": 0.000230108283295229, "loss": 0.0614, "step": 73500 }, { "epoch": 1.85, "eval_cer": 0.6650766816473669, "eval_loss": 0.05350416526198387, "eval_runtime": 90.6695, "eval_samples_per_second": 110.28, "eval_steps_per_second": 6.893, "step": 73500 }, { "epoch": 1.85, "learning_rate": 0.0002297314272793508, "loss": 0.0602, "step": 73510 }, { "epoch": 1.85, "learning_rate": 0.00022935457126347262, "loss": 0.0594, "step": 73520 }, { "epoch": 1.85, "learning_rate": 0.00022897771524759441, "loss": 0.0626, "step": 73530 }, { "epoch": 1.85, "learning_rate": 0.0002286008592317162, "loss": 0.0614, "step": 73540 }, { "epoch": 1.85, "learning_rate": 0.000228224003215838, "loss": 0.0646, "step": 73550 }, { "epoch": 1.85, "learning_rate": 0.0002278471471999598, "loss": 0.0639, "step": 73560 }, { "epoch": 1.85, "learning_rate": 0.0002274702911840816, "loss": 0.0618, "step": 73570 }, { "epoch": 1.85, "learning_rate": 0.00022709343516820344, "loss": 0.0637, "step": 73580 }, { "epoch": 1.85, "learning_rate": 0.00022671657915232518, "loss": 0.0614, "step": 73590 }, { "epoch": 1.85, "learning_rate": 0.00022633972313644698, "loss": 0.0609, "step": 73600 }, { "epoch": 1.85, "learning_rate": 0.0002259628671205688, "loss": 0.0601, "step": 73610 }, { "epoch": 1.85, "learning_rate": 0.0002255860111046906, "loss": 0.0569, "step": 73620 }, { "epoch": 1.85, "learning_rate": 0.0002252091550888124, "loss": 0.0641, "step": 73630 }, { "epoch": 1.85, "learning_rate": 0.0002248322990729342, "loss": 0.0613, "step": 73640 }, { "epoch": 1.85, "learning_rate": 0.000224455443057056, "loss": 0.0633, "step": 73650 }, { "epoch": 1.85, "learning_rate": 0.0002240785870411778, "loss": 0.0618, "step": 73660 }, { "epoch": 1.85, "learning_rate": 0.00022370173102529963, "loss": 0.0619, "step": 73670 }, { "epoch": 1.85, "learning_rate": 0.00022332487500942142, "loss": 0.0642, "step": 73680 }, { "epoch": 1.85, "learning_rate": 0.00022294801899354322, "loss": 0.0618, "step": 73690 }, { "epoch": 1.85, "learning_rate": 0.000222571162977665, "loss": 0.0605, "step": 73700 }, { "epoch": 1.85, "learning_rate": 0.0002221943069617868, "loss": 0.0658, "step": 73710 }, { "epoch": 1.85, "learning_rate": 0.0002218174509459086, "loss": 0.0605, "step": 73720 }, { "epoch": 1.85, "learning_rate": 0.0002214405949300304, "loss": 0.0638, "step": 73730 }, { "epoch": 1.85, "learning_rate": 0.0002210637389141522, "loss": 0.062, "step": 73740 }, { "epoch": 1.85, "learning_rate": 0.000220686882898274, "loss": 0.0607, "step": 73750 }, { "epoch": 1.85, "learning_rate": 0.00022031002688239581, "loss": 0.0656, "step": 73760 }, { "epoch": 1.85, "learning_rate": 0.00021993317086651761, "loss": 0.06, "step": 73770 }, { "epoch": 1.85, "learning_rate": 0.0002195563148506394, "loss": 0.0642, "step": 73780 }, { "epoch": 1.85, "learning_rate": 0.0002191794588347612, "loss": 0.0611, "step": 73790 }, { "epoch": 1.85, "learning_rate": 0.000218802602818883, "loss": 0.062, "step": 73800 }, { "epoch": 1.85, "learning_rate": 0.00021842574680300484, "loss": 0.0585, "step": 73810 }, { "epoch": 1.85, "learning_rate": 0.00021804889078712658, "loss": 0.0629, "step": 73820 }, { "epoch": 1.85, "learning_rate": 0.00021767203477124838, "loss": 0.0611, "step": 73830 }, { "epoch": 1.86, "learning_rate": 0.0002172951787553702, "loss": 0.0585, "step": 73840 }, { "epoch": 1.86, "learning_rate": 0.000216918322739492, "loss": 0.0621, "step": 73850 }, { "epoch": 1.86, "learning_rate": 0.0002165414667236138, "loss": 0.0632, "step": 73860 }, { "epoch": 1.86, "learning_rate": 0.0002161646107077356, "loss": 0.0565, "step": 73870 }, { "epoch": 1.86, "learning_rate": 0.0002157877546918574, "loss": 0.062, "step": 73880 }, { "epoch": 1.86, "learning_rate": 0.0002154108986759792, "loss": 0.0601, "step": 73890 }, { "epoch": 1.86, "learning_rate": 0.00021503404266010103, "loss": 0.0619, "step": 73900 }, { "epoch": 1.86, "learning_rate": 0.00021465718664422282, "loss": 0.0621, "step": 73910 }, { "epoch": 1.86, "learning_rate": 0.00021428033062834462, "loss": 0.063, "step": 73920 }, { "epoch": 1.86, "learning_rate": 0.0002139034746124664, "loss": 0.0603, "step": 73930 }, { "epoch": 1.86, "learning_rate": 0.0002135266185965882, "loss": 0.0611, "step": 73940 }, { "epoch": 1.86, "learning_rate": 0.00021314976258071, "loss": 0.0607, "step": 73950 }, { "epoch": 1.86, "learning_rate": 0.0002127729065648318, "loss": 0.0608, "step": 73960 }, { "epoch": 1.86, "learning_rate": 0.0002123960505489536, "loss": 0.0646, "step": 73970 }, { "epoch": 1.86, "learning_rate": 0.0002120191945330754, "loss": 0.0626, "step": 73980 }, { "epoch": 1.86, "learning_rate": 0.00021164233851719722, "loss": 0.0613, "step": 73990 }, { "epoch": 1.86, "learning_rate": 0.00021126548250131901, "loss": 0.0637, "step": 74000 }, { "epoch": 1.86, "eval_cer": 0.6652446310334854, "eval_loss": 0.05332941189408302, "eval_runtime": 90.5983, "eval_samples_per_second": 110.366, "eval_steps_per_second": 6.899, "step": 74000 }, { "epoch": 1.86, "learning_rate": 0.0002108886264854408, "loss": 0.0586, "step": 74010 }, { "epoch": 1.86, "learning_rate": 0.0002105117704695626, "loss": 0.0622, "step": 74020 }, { "epoch": 1.86, "learning_rate": 0.0002101349144536844, "loss": 0.0609, "step": 74030 }, { "epoch": 1.86, "learning_rate": 0.00020975805843780618, "loss": 0.0626, "step": 74040 }, { "epoch": 1.86, "learning_rate": 0.00020938120242192798, "loss": 0.0623, "step": 74050 }, { "epoch": 1.86, "learning_rate": 0.00020900434640604978, "loss": 0.0624, "step": 74060 }, { "epoch": 1.86, "learning_rate": 0.0002086274903901716, "loss": 0.0633, "step": 74070 }, { "epoch": 1.86, "learning_rate": 0.0002082506343742934, "loss": 0.0606, "step": 74080 }, { "epoch": 1.86, "learning_rate": 0.0002078737783584152, "loss": 0.0606, "step": 74090 }, { "epoch": 1.86, "learning_rate": 0.000207496922342537, "loss": 0.0625, "step": 74100 }, { "epoch": 1.86, "learning_rate": 0.0002071200663266588, "loss": 0.0605, "step": 74110 }, { "epoch": 1.86, "learning_rate": 0.0002067432103107806, "loss": 0.0646, "step": 74120 }, { "epoch": 1.86, "learning_rate": 0.00020636635429490243, "loss": 0.0629, "step": 74130 }, { "epoch": 1.86, "learning_rate": 0.00020598949827902422, "loss": 0.0647, "step": 74140 }, { "epoch": 1.86, "learning_rate": 0.00020561264226314597, "loss": 0.0641, "step": 74150 }, { "epoch": 1.86, "learning_rate": 0.0002052357862472678, "loss": 0.061, "step": 74160 }, { "epoch": 1.86, "learning_rate": 0.0002048589302313896, "loss": 0.0626, "step": 74170 }, { "epoch": 1.86, "learning_rate": 0.0002044820742155114, "loss": 0.061, "step": 74180 }, { "epoch": 1.86, "learning_rate": 0.0002041052181996332, "loss": 0.0581, "step": 74190 }, { "epoch": 1.86, "learning_rate": 0.000203728362183755, "loss": 0.0625, "step": 74200 }, { "epoch": 1.86, "learning_rate": 0.0002033515061678768, "loss": 0.0598, "step": 74210 }, { "epoch": 1.86, "learning_rate": 0.00020297465015199862, "loss": 0.0641, "step": 74220 }, { "epoch": 1.86, "learning_rate": 0.00020259779413612041, "loss": 0.0615, "step": 74230 }, { "epoch": 1.87, "learning_rate": 0.0002022209381202422, "loss": 0.0638, "step": 74240 }, { "epoch": 1.87, "learning_rate": 0.000201844082104364, "loss": 0.0621, "step": 74250 }, { "epoch": 1.87, "learning_rate": 0.00020146722608848578, "loss": 0.0626, "step": 74260 }, { "epoch": 1.87, "learning_rate": 0.00020109037007260758, "loss": 0.0625, "step": 74270 }, { "epoch": 1.87, "learning_rate": 0.00020071351405672938, "loss": 0.0633, "step": 74280 }, { "epoch": 1.87, "learning_rate": 0.00020033665804085118, "loss": 0.062, "step": 74290 }, { "epoch": 1.87, "learning_rate": 0.00019995980202497298, "loss": 0.0593, "step": 74300 }, { "epoch": 1.87, "learning_rate": 0.0001995829460090948, "loss": 0.0612, "step": 74310 }, { "epoch": 1.87, "learning_rate": 0.0001992060899932166, "loss": 0.0609, "step": 74320 }, { "epoch": 1.87, "learning_rate": 0.0001988292339773384, "loss": 0.0638, "step": 74330 }, { "epoch": 1.87, "learning_rate": 0.0001984523779614602, "loss": 0.0621, "step": 74340 }, { "epoch": 1.87, "learning_rate": 0.000198075521945582, "loss": 0.0627, "step": 74350 }, { "epoch": 1.87, "learning_rate": 0.00019769866592970383, "loss": 0.0624, "step": 74360 }, { "epoch": 1.87, "learning_rate": 0.00019732180991382557, "loss": 0.0619, "step": 74370 }, { "epoch": 1.87, "learning_rate": 0.00019694495389794737, "loss": 0.0622, "step": 74380 }, { "epoch": 1.87, "learning_rate": 0.0001965680978820692, "loss": 0.0612, "step": 74390 }, { "epoch": 1.87, "learning_rate": 0.000196191241866191, "loss": 0.0639, "step": 74400 }, { "epoch": 1.87, "learning_rate": 0.0001958143858503128, "loss": 0.0642, "step": 74410 }, { "epoch": 1.87, "learning_rate": 0.0001954375298344346, "loss": 0.0624, "step": 74420 }, { "epoch": 1.87, "learning_rate": 0.0001950606738185564, "loss": 0.06, "step": 74430 }, { "epoch": 1.87, "learning_rate": 0.0001946838178026782, "loss": 0.0627, "step": 74440 }, { "epoch": 1.87, "learning_rate": 0.00019430696178680002, "loss": 0.0621, "step": 74450 }, { "epoch": 1.87, "learning_rate": 0.00019393010577092181, "loss": 0.0616, "step": 74460 }, { "epoch": 1.87, "learning_rate": 0.0001935532497550436, "loss": 0.0637, "step": 74470 }, { "epoch": 1.87, "learning_rate": 0.00019317639373916539, "loss": 0.0612, "step": 74480 }, { "epoch": 1.87, "learning_rate": 0.00019279953772328718, "loss": 0.0613, "step": 74490 }, { "epoch": 1.87, "learning_rate": 0.00019242268170740898, "loss": 0.0619, "step": 74500 }, { "epoch": 1.87, "eval_cer": 0.6651796649385685, "eval_loss": 0.05317223444581032, "eval_runtime": 90.7609, "eval_samples_per_second": 110.169, "eval_steps_per_second": 6.886, "step": 74500 }, { "epoch": 1.87, "learning_rate": 0.00019204582569153078, "loss": 0.0611, "step": 74510 }, { "epoch": 1.87, "learning_rate": 0.00019166896967565258, "loss": 0.0631, "step": 74520 }, { "epoch": 1.87, "learning_rate": 0.00019129211365977438, "loss": 0.0604, "step": 74530 }, { "epoch": 1.87, "learning_rate": 0.0001909152576438962, "loss": 0.0617, "step": 74540 }, { "epoch": 1.87, "learning_rate": 0.000190538401628018, "loss": 0.0622, "step": 74550 }, { "epoch": 1.87, "learning_rate": 0.0001901615456121398, "loss": 0.0611, "step": 74560 }, { "epoch": 1.87, "learning_rate": 0.0001897846895962616, "loss": 0.0623, "step": 74570 }, { "epoch": 1.87, "learning_rate": 0.0001894078335803834, "loss": 0.0642, "step": 74580 }, { "epoch": 1.87, "learning_rate": 0.00018903097756450517, "loss": 0.0606, "step": 74590 }, { "epoch": 1.87, "learning_rate": 0.00018865412154862697, "loss": 0.061, "step": 74600 }, { "epoch": 1.87, "learning_rate": 0.00018827726553274877, "loss": 0.0626, "step": 74610 }, { "epoch": 1.87, "learning_rate": 0.00018790040951687057, "loss": 0.0606, "step": 74620 }, { "epoch": 1.87, "learning_rate": 0.0001875235535009924, "loss": 0.063, "step": 74630 }, { "epoch": 1.88, "learning_rate": 0.0001871466974851142, "loss": 0.0589, "step": 74640 }, { "epoch": 1.88, "learning_rate": 0.000186769841469236, "loss": 0.0607, "step": 74650 }, { "epoch": 1.88, "learning_rate": 0.0001863929854533578, "loss": 0.0611, "step": 74660 }, { "epoch": 1.88, "learning_rate": 0.0001860161294374796, "loss": 0.0629, "step": 74670 }, { "epoch": 1.88, "learning_rate": 0.0001856392734216014, "loss": 0.0618, "step": 74680 }, { "epoch": 1.88, "learning_rate": 0.0001852624174057232, "loss": 0.058, "step": 74690 }, { "epoch": 1.88, "learning_rate": 0.000184885561389845, "loss": 0.0639, "step": 74700 }, { "epoch": 1.88, "learning_rate": 0.00018450870537396679, "loss": 0.0637, "step": 74710 }, { "epoch": 1.88, "learning_rate": 0.00018413184935808858, "loss": 0.0634, "step": 74720 }, { "epoch": 1.88, "learning_rate": 0.00018375499334221038, "loss": 0.0567, "step": 74730 }, { "epoch": 1.88, "learning_rate": 0.00018337813732633218, "loss": 0.0576, "step": 74740 }, { "epoch": 1.88, "learning_rate": 0.00018300128131045398, "loss": 0.0599, "step": 74750 }, { "epoch": 1.88, "learning_rate": 0.00018262442529457578, "loss": 0.0596, "step": 74760 }, { "epoch": 1.88, "learning_rate": 0.0001822475692786976, "loss": 0.0616, "step": 74770 }, { "epoch": 1.88, "learning_rate": 0.0001818707132628194, "loss": 0.0602, "step": 74780 }, { "epoch": 1.88, "learning_rate": 0.00018149385724694118, "loss": 0.0604, "step": 74790 }, { "epoch": 1.88, "learning_rate": 0.00018111700123106298, "loss": 0.0608, "step": 74800 }, { "epoch": 1.88, "learning_rate": 0.0001807401452151848, "loss": 0.0638, "step": 74810 }, { "epoch": 1.88, "learning_rate": 0.0001803632891993066, "loss": 0.0636, "step": 74820 }, { "epoch": 1.88, "learning_rate": 0.0001799864331834284, "loss": 0.0595, "step": 74830 }, { "epoch": 1.88, "learning_rate": 0.00017960957716755017, "loss": 0.0616, "step": 74840 }, { "epoch": 1.88, "learning_rate": 0.00017923272115167197, "loss": 0.0611, "step": 74850 }, { "epoch": 1.88, "learning_rate": 0.0001788558651357938, "loss": 0.0591, "step": 74860 }, { "epoch": 1.88, "learning_rate": 0.0001784790091199156, "loss": 0.0575, "step": 74870 }, { "epoch": 1.88, "learning_rate": 0.0001781021531040374, "loss": 0.0632, "step": 74880 }, { "epoch": 1.88, "learning_rate": 0.0001777252970881592, "loss": 0.062, "step": 74890 }, { "epoch": 1.88, "learning_rate": 0.000177348441072281, "loss": 0.0615, "step": 74900 }, { "epoch": 1.88, "learning_rate": 0.0001769715850564028, "loss": 0.0619, "step": 74910 }, { "epoch": 1.88, "learning_rate": 0.0001765947290405246, "loss": 0.0614, "step": 74920 }, { "epoch": 1.88, "learning_rate": 0.0001762178730246464, "loss": 0.0631, "step": 74930 }, { "epoch": 1.88, "learning_rate": 0.00017584101700876819, "loss": 0.0608, "step": 74940 }, { "epoch": 1.88, "learning_rate": 0.00017546416099288998, "loss": 0.0625, "step": 74950 }, { "epoch": 1.88, "learning_rate": 0.00017508730497701178, "loss": 0.063, "step": 74960 }, { "epoch": 1.88, "learning_rate": 0.00017471044896113358, "loss": 0.059, "step": 74970 }, { "epoch": 1.88, "learning_rate": 0.00017433359294525538, "loss": 0.0625, "step": 74980 }, { "epoch": 1.88, "learning_rate": 0.00017395673692937718, "loss": 0.063, "step": 74990 }, { "epoch": 1.88, "learning_rate": 0.000173579880913499, "loss": 0.061, "step": 75000 }, { "epoch": 1.88, "eval_cer": 0.6652123886011934, "eval_loss": 0.053149040788412094, "eval_runtime": 90.705, "eval_samples_per_second": 110.236, "eval_steps_per_second": 6.89, "step": 75000 }, { "epoch": 1.88, "learning_rate": 0.00017320302489762078, "loss": 0.0612, "step": 75010 }, { "epoch": 1.88, "learning_rate": 0.00017282616888174258, "loss": 0.0604, "step": 75020 }, { "epoch": 1.89, "learning_rate": 0.00017244931286586438, "loss": 0.0622, "step": 75030 }, { "epoch": 1.89, "learning_rate": 0.0001720724568499862, "loss": 0.0589, "step": 75040 }, { "epoch": 1.89, "learning_rate": 0.000171695600834108, "loss": 0.0621, "step": 75050 }, { "epoch": 1.89, "learning_rate": 0.0001713187448182298, "loss": 0.0597, "step": 75060 }, { "epoch": 1.89, "learning_rate": 0.00017094188880235157, "loss": 0.0618, "step": 75070 }, { "epoch": 1.89, "learning_rate": 0.00017056503278647337, "loss": 0.0644, "step": 75080 }, { "epoch": 1.89, "learning_rate": 0.0001701881767705952, "loss": 0.0632, "step": 75090 }, { "epoch": 1.89, "learning_rate": 0.000169811320754717, "loss": 0.0613, "step": 75100 }, { "epoch": 1.89, "learning_rate": 0.0001694344647388388, "loss": 0.0642, "step": 75110 }, { "epoch": 1.89, "learning_rate": 0.00016905760872296056, "loss": 0.0618, "step": 75120 }, { "epoch": 1.89, "learning_rate": 0.0001686807527070824, "loss": 0.0571, "step": 75130 }, { "epoch": 1.89, "learning_rate": 0.0001683038966912042, "loss": 0.0607, "step": 75140 }, { "epoch": 1.89, "learning_rate": 0.000167927040675326, "loss": 0.0586, "step": 75150 }, { "epoch": 1.89, "learning_rate": 0.0001675501846594478, "loss": 0.0608, "step": 75160 }, { "epoch": 1.89, "learning_rate": 0.00016717332864356959, "loss": 0.0623, "step": 75170 }, { "epoch": 1.89, "learning_rate": 0.00016679647262769139, "loss": 0.0565, "step": 75180 }, { "epoch": 1.89, "learning_rate": 0.00016641961661181318, "loss": 0.0645, "step": 75190 }, { "epoch": 1.89, "learning_rate": 0.00016604276059593498, "loss": 0.0638, "step": 75200 }, { "epoch": 1.89, "learning_rate": 0.00016566590458005678, "loss": 0.0612, "step": 75210 }, { "epoch": 1.89, "learning_rate": 0.00016528904856417858, "loss": 0.0626, "step": 75220 }, { "epoch": 1.89, "learning_rate": 0.00016491219254830038, "loss": 0.0621, "step": 75230 }, { "epoch": 1.89, "learning_rate": 0.00016453533653242218, "loss": 0.0595, "step": 75240 }, { "epoch": 1.89, "learning_rate": 0.00016415848051654398, "loss": 0.0615, "step": 75250 }, { "epoch": 1.89, "learning_rate": 0.00016378162450066578, "loss": 0.0623, "step": 75260 }, { "epoch": 1.89, "learning_rate": 0.00016340476848478757, "loss": 0.0596, "step": 75270 }, { "epoch": 1.89, "learning_rate": 0.0001630279124689094, "loss": 0.0609, "step": 75280 }, { "epoch": 1.89, "learning_rate": 0.00016265105645303117, "loss": 0.06, "step": 75290 }, { "epoch": 1.89, "learning_rate": 0.00016227420043715297, "loss": 0.0614, "step": 75300 }, { "epoch": 1.89, "learning_rate": 0.00016189734442127477, "loss": 0.0612, "step": 75310 }, { "epoch": 1.89, "learning_rate": 0.0001615204884053966, "loss": 0.0614, "step": 75320 }, { "epoch": 1.89, "learning_rate": 0.0001611436323895184, "loss": 0.0606, "step": 75330 }, { "epoch": 1.89, "learning_rate": 0.00016076677637364017, "loss": 0.0606, "step": 75340 }, { "epoch": 1.89, "learning_rate": 0.00016038992035776197, "loss": 0.0597, "step": 75350 }, { "epoch": 1.89, "learning_rate": 0.0001600130643418838, "loss": 0.0607, "step": 75360 }, { "epoch": 1.89, "learning_rate": 0.0001596362083260056, "loss": 0.0606, "step": 75370 }, { "epoch": 1.89, "learning_rate": 0.0001592593523101274, "loss": 0.0601, "step": 75380 }, { "epoch": 1.89, "learning_rate": 0.0001588824962942492, "loss": 0.0634, "step": 75390 }, { "epoch": 1.89, "learning_rate": 0.00015850564027837096, "loss": 0.0597, "step": 75400 }, { "epoch": 1.89, "learning_rate": 0.00015812878426249279, "loss": 0.0604, "step": 75410 }, { "epoch": 1.89, "learning_rate": 0.00015775192824661458, "loss": 0.0585, "step": 75420 }, { "epoch": 1.9, "learning_rate": 0.00015737507223073638, "loss": 0.0598, "step": 75430 }, { "epoch": 1.9, "learning_rate": 0.00015699821621485818, "loss": 0.0601, "step": 75440 }, { "epoch": 1.9, "learning_rate": 0.00015662136019897998, "loss": 0.0603, "step": 75450 }, { "epoch": 1.9, "learning_rate": 0.00015624450418310178, "loss": 0.0614, "step": 75460 }, { "epoch": 1.9, "learning_rate": 0.00015586764816722358, "loss": 0.0635, "step": 75470 }, { "epoch": 1.9, "learning_rate": 0.00015549079215134538, "loss": 0.0631, "step": 75480 }, { "epoch": 1.9, "learning_rate": 0.00015511393613546718, "loss": 0.062, "step": 75490 }, { "epoch": 1.9, "learning_rate": 0.00015473708011958897, "loss": 0.0598, "step": 75500 }, { "epoch": 1.9, "eval_cer": 0.6651926581575519, "eval_loss": 0.05298503488302231, "eval_runtime": 91.1794, "eval_samples_per_second": 109.663, "eval_steps_per_second": 6.855, "step": 75500 }, { "epoch": 1.9, "learning_rate": 0.00015436022410371077, "loss": 0.0576, "step": 75510 }, { "epoch": 1.9, "learning_rate": 0.00015398336808783257, "loss": 0.062, "step": 75520 }, { "epoch": 1.9, "learning_rate": 0.00015360651207195437, "loss": 0.061, "step": 75530 }, { "epoch": 1.9, "learning_rate": 0.00015322965605607617, "loss": 0.0636, "step": 75540 }, { "epoch": 1.9, "learning_rate": 0.000152852800040198, "loss": 0.0624, "step": 75550 }, { "epoch": 1.9, "learning_rate": 0.0001524759440243198, "loss": 0.061, "step": 75560 }, { "epoch": 1.9, "learning_rate": 0.00015209908800844157, "loss": 0.0629, "step": 75570 }, { "epoch": 1.9, "learning_rate": 0.00015172223199256337, "loss": 0.0599, "step": 75580 }, { "epoch": 1.9, "learning_rate": 0.00015134537597668516, "loss": 0.0635, "step": 75590 }, { "epoch": 1.9, "learning_rate": 0.000150968519960807, "loss": 0.0559, "step": 75600 }, { "epoch": 1.9, "learning_rate": 0.0001505916639449288, "loss": 0.0611, "step": 75610 }, { "epoch": 1.9, "learning_rate": 0.00015021480792905056, "loss": 0.059, "step": 75620 }, { "epoch": 1.9, "learning_rate": 0.00014983795191317236, "loss": 0.0613, "step": 75630 }, { "epoch": 1.9, "learning_rate": 0.00014946109589729419, "loss": 0.0604, "step": 75640 }, { "epoch": 1.9, "learning_rate": 0.00014908423988141598, "loss": 0.0607, "step": 75650 }, { "epoch": 1.9, "learning_rate": 0.00014870738386553778, "loss": 0.0605, "step": 75660 }, { "epoch": 1.9, "learning_rate": 0.00014833052784965958, "loss": 0.0626, "step": 75670 }, { "epoch": 1.9, "learning_rate": 0.00014795367183378138, "loss": 0.0625, "step": 75680 }, { "epoch": 1.9, "learning_rate": 0.00014757681581790318, "loss": 0.0585, "step": 75690 }, { "epoch": 1.9, "learning_rate": 0.00014719995980202498, "loss": 0.0611, "step": 75700 }, { "epoch": 1.9, "learning_rate": 0.00014682310378614678, "loss": 0.0623, "step": 75710 }, { "epoch": 1.9, "learning_rate": 0.00014644624777026858, "loss": 0.0605, "step": 75720 }, { "epoch": 1.9, "learning_rate": 0.00014606939175439038, "loss": 0.0613, "step": 75730 }, { "epoch": 1.9, "learning_rate": 0.00014569253573851217, "loss": 0.0619, "step": 75740 }, { "epoch": 1.9, "learning_rate": 0.00014531567972263397, "loss": 0.0607, "step": 75750 }, { "epoch": 1.9, "learning_rate": 0.00014493882370675577, "loss": 0.06, "step": 75760 }, { "epoch": 1.9, "learning_rate": 0.00014456196769087757, "loss": 0.0591, "step": 75770 }, { "epoch": 1.9, "learning_rate": 0.0001441851116749994, "loss": 0.0616, "step": 75780 }, { "epoch": 1.9, "learning_rate": 0.00014380825565912117, "loss": 0.0623, "step": 75790 }, { "epoch": 1.9, "learning_rate": 0.00014343139964324297, "loss": 0.062, "step": 75800 }, { "epoch": 1.9, "learning_rate": 0.00014305454362736477, "loss": 0.0624, "step": 75810 }, { "epoch": 1.9, "learning_rate": 0.00014267768761148656, "loss": 0.0652, "step": 75820 }, { "epoch": 1.91, "learning_rate": 0.0001423008315956084, "loss": 0.0615, "step": 75830 }, { "epoch": 1.91, "learning_rate": 0.0001419239755797302, "loss": 0.0632, "step": 75840 }, { "epoch": 1.91, "learning_rate": 0.00014154711956385196, "loss": 0.0638, "step": 75850 }, { "epoch": 1.91, "learning_rate": 0.00014117026354797376, "loss": 0.0614, "step": 75860 }, { "epoch": 1.91, "learning_rate": 0.00014079340753209559, "loss": 0.061, "step": 75870 }, { "epoch": 1.91, "learning_rate": 0.00014041655151621738, "loss": 0.0582, "step": 75880 }, { "epoch": 1.91, "learning_rate": 0.00014003969550033918, "loss": 0.0615, "step": 75890 }, { "epoch": 1.91, "learning_rate": 0.00013966283948446096, "loss": 0.0606, "step": 75900 }, { "epoch": 1.91, "learning_rate": 0.00013928598346858275, "loss": 0.0621, "step": 75910 }, { "epoch": 1.91, "learning_rate": 0.00013890912745270458, "loss": 0.0597, "step": 75920 }, { "epoch": 1.91, "learning_rate": 0.00013853227143682638, "loss": 0.0597, "step": 75930 }, { "epoch": 1.91, "learning_rate": 0.00013815541542094818, "loss": 0.0604, "step": 75940 }, { "epoch": 1.91, "learning_rate": 0.00013777855940506998, "loss": 0.0604, "step": 75950 }, { "epoch": 1.91, "learning_rate": 0.00013740170338919178, "loss": 0.0605, "step": 75960 }, { "epoch": 1.91, "learning_rate": 0.00013702484737331357, "loss": 0.0639, "step": 75970 }, { "epoch": 1.91, "learning_rate": 0.00013664799135743537, "loss": 0.0634, "step": 75980 }, { "epoch": 1.91, "learning_rate": 0.00013627113534155717, "loss": 0.0606, "step": 75990 }, { "epoch": 1.91, "learning_rate": 0.00013589427932567897, "loss": 0.0643, "step": 76000 }, { "epoch": 1.91, "eval_cer": 0.6651921769272192, "eval_loss": 0.05285988375544548, "eval_runtime": 90.7457, "eval_samples_per_second": 110.187, "eval_steps_per_second": 6.887, "step": 76000 }, { "epoch": 1.91, "learning_rate": 0.00013551742330980077, "loss": 0.0622, "step": 76010 }, { "epoch": 1.91, "learning_rate": 0.00013514056729392257, "loss": 0.0618, "step": 76020 }, { "epoch": 1.91, "learning_rate": 0.00013476371127804437, "loss": 0.0587, "step": 76030 }, { "epoch": 1.91, "learning_rate": 0.00013438685526216617, "loss": 0.0587, "step": 76040 }, { "epoch": 1.91, "learning_rate": 0.00013400999924628797, "loss": 0.0647, "step": 76050 }, { "epoch": 1.91, "learning_rate": 0.0001336331432304098, "loss": 0.0577, "step": 76060 }, { "epoch": 1.91, "learning_rate": 0.00013325628721453156, "loss": 0.0638, "step": 76070 }, { "epoch": 1.91, "learning_rate": 0.00013287943119865336, "loss": 0.0638, "step": 76080 }, { "epoch": 1.91, "learning_rate": 0.00013250257518277516, "loss": 0.0592, "step": 76090 }, { "epoch": 1.91, "learning_rate": 0.00013212571916689699, "loss": 0.0623, "step": 76100 }, { "epoch": 1.91, "learning_rate": 0.00013174886315101879, "loss": 0.0623, "step": 76110 }, { "epoch": 1.91, "learning_rate": 0.00013137200713514056, "loss": 0.0616, "step": 76120 }, { "epoch": 1.91, "learning_rate": 0.00013099515111926236, "loss": 0.0626, "step": 76130 }, { "epoch": 1.91, "learning_rate": 0.00013061829510338415, "loss": 0.0611, "step": 76140 }, { "epoch": 1.91, "learning_rate": 0.00013024143908750598, "loss": 0.061, "step": 76150 }, { "epoch": 1.91, "learning_rate": 0.00012986458307162778, "loss": 0.0583, "step": 76160 }, { "epoch": 1.91, "learning_rate": 0.00012948772705574958, "loss": 0.0622, "step": 76170 }, { "epoch": 1.91, "learning_rate": 0.00012911087103987135, "loss": 0.0591, "step": 76180 }, { "epoch": 1.91, "learning_rate": 0.00012873401502399318, "loss": 0.0635, "step": 76190 }, { "epoch": 1.91, "learning_rate": 0.00012835715900811497, "loss": 0.0619, "step": 76200 }, { "epoch": 1.91, "learning_rate": 0.00012798030299223677, "loss": 0.0604, "step": 76210 }, { "epoch": 1.91, "learning_rate": 0.00012760344697635857, "loss": 0.0595, "step": 76220 }, { "epoch": 1.92, "learning_rate": 0.00012722659096048037, "loss": 0.0601, "step": 76230 }, { "epoch": 1.92, "learning_rate": 0.00012684973494460217, "loss": 0.0608, "step": 76240 }, { "epoch": 1.92, "learning_rate": 0.00012647287892872397, "loss": 0.0608, "step": 76250 }, { "epoch": 1.92, "learning_rate": 0.00012609602291284577, "loss": 0.0606, "step": 76260 }, { "epoch": 1.92, "learning_rate": 0.00012571916689696757, "loss": 0.0589, "step": 76270 }, { "epoch": 1.92, "learning_rate": 0.00012534231088108937, "loss": 0.0594, "step": 76280 }, { "epoch": 1.92, "learning_rate": 0.00012496545486521116, "loss": 0.0609, "step": 76290 }, { "epoch": 1.92, "learning_rate": 0.00012458859884933296, "loss": 0.0627, "step": 76300 }, { "epoch": 1.92, "learning_rate": 0.00012421174283345476, "loss": 0.0629, "step": 76310 }, { "epoch": 1.92, "learning_rate": 0.00012383488681757656, "loss": 0.0601, "step": 76320 }, { "epoch": 1.92, "learning_rate": 0.0001234580308016984, "loss": 0.0604, "step": 76330 }, { "epoch": 1.92, "learning_rate": 0.00012308117478582019, "loss": 0.0608, "step": 76340 }, { "epoch": 1.92, "learning_rate": 0.00012270431876994196, "loss": 0.0641, "step": 76350 }, { "epoch": 1.92, "learning_rate": 0.00012232746275406376, "loss": 0.0595, "step": 76360 }, { "epoch": 1.92, "learning_rate": 0.00012195060673818557, "loss": 0.0623, "step": 76370 }, { "epoch": 1.92, "learning_rate": 0.00012157375072230737, "loss": 0.0612, "step": 76380 }, { "epoch": 1.92, "learning_rate": 0.00012119689470642918, "loss": 0.0595, "step": 76390 }, { "epoch": 1.92, "learning_rate": 0.00012082003869055095, "loss": 0.0604, "step": 76400 }, { "epoch": 1.92, "learning_rate": 0.00012044318267467276, "loss": 0.0606, "step": 76410 }, { "epoch": 1.92, "learning_rate": 0.00012006632665879456, "loss": 0.0601, "step": 76420 }, { "epoch": 1.92, "learning_rate": 0.00011968947064291636, "loss": 0.0615, "step": 76430 }, { "epoch": 1.92, "learning_rate": 0.00011931261462703817, "loss": 0.0646, "step": 76440 }, { "epoch": 1.92, "learning_rate": 0.00011893575861115997, "loss": 0.0611, "step": 76450 }, { "epoch": 1.92, "learning_rate": 0.00011855890259528176, "loss": 0.0622, "step": 76460 }, { "epoch": 1.92, "learning_rate": 0.00011818204657940356, "loss": 0.0598, "step": 76470 }, { "epoch": 1.92, "learning_rate": 0.00011780519056352537, "loss": 0.0623, "step": 76480 }, { "epoch": 1.92, "learning_rate": 0.00011742833454764717, "loss": 0.0632, "step": 76490 }, { "epoch": 1.92, "learning_rate": 0.00011705147853176897, "loss": 0.0609, "step": 76500 }, { "epoch": 1.92, "eval_cer": 0.6651411665119511, "eval_loss": 0.05271696671843529, "eval_runtime": 90.4198, "eval_samples_per_second": 110.584, "eval_steps_per_second": 6.912, "step": 76500 }, { "epoch": 1.92, "learning_rate": 0.00011667462251589075, "loss": 0.0632, "step": 76510 }, { "epoch": 1.92, "learning_rate": 0.00011629776650001256, "loss": 0.0614, "step": 76520 }, { "epoch": 1.92, "learning_rate": 0.00011592091048413436, "loss": 0.064, "step": 76530 }, { "epoch": 1.92, "learning_rate": 0.00011554405446825616, "loss": 0.0609, "step": 76540 }, { "epoch": 1.92, "learning_rate": 0.00011516719845237797, "loss": 0.0604, "step": 76550 }, { "epoch": 1.92, "learning_rate": 0.00011479034243649977, "loss": 0.0609, "step": 76560 }, { "epoch": 1.92, "learning_rate": 0.00011441348642062156, "loss": 0.0631, "step": 76570 }, { "epoch": 1.92, "learning_rate": 0.00011403663040474336, "loss": 0.062, "step": 76580 }, { "epoch": 1.92, "learning_rate": 0.00011365977438886516, "loss": 0.0616, "step": 76590 }, { "epoch": 1.92, "learning_rate": 0.00011328291837298697, "loss": 0.059, "step": 76600 }, { "epoch": 1.92, "learning_rate": 0.00011290606235710877, "loss": 0.0602, "step": 76610 }, { "epoch": 1.92, "learning_rate": 0.00011252920634123055, "loss": 0.0621, "step": 76620 }, { "epoch": 1.93, "learning_rate": 0.00011215235032535235, "loss": 0.0595, "step": 76630 }, { "epoch": 1.93, "learning_rate": 0.00011177549430947416, "loss": 0.0604, "step": 76640 }, { "epoch": 1.93, "learning_rate": 0.00011139863829359596, "loss": 0.0627, "step": 76650 }, { "epoch": 1.93, "learning_rate": 0.00011102178227771776, "loss": 0.0638, "step": 76660 }, { "epoch": 1.93, "learning_rate": 0.00011064492626183957, "loss": 0.0595, "step": 76670 }, { "epoch": 1.93, "learning_rate": 0.00011026807024596136, "loss": 0.0613, "step": 76680 }, { "epoch": 1.93, "learning_rate": 0.00010989121423008316, "loss": 0.0623, "step": 76690 }, { "epoch": 1.93, "learning_rate": 0.00010951435821420496, "loss": 0.0575, "step": 76700 }, { "epoch": 1.93, "learning_rate": 0.00010913750219832677, "loss": 0.06, "step": 76710 }, { "epoch": 1.93, "learning_rate": 0.00010876064618244857, "loss": 0.0595, "step": 76720 }, { "epoch": 1.93, "learning_rate": 0.00010838379016657037, "loss": 0.0584, "step": 76730 }, { "epoch": 1.93, "learning_rate": 0.00010800693415069215, "loss": 0.0625, "step": 76740 }, { "epoch": 1.93, "learning_rate": 0.00010763007813481395, "loss": 0.064, "step": 76750 }, { "epoch": 1.93, "learning_rate": 0.00010725322211893576, "loss": 0.0598, "step": 76760 }, { "epoch": 1.93, "learning_rate": 0.00010687636610305756, "loss": 0.0615, "step": 76770 }, { "epoch": 1.93, "learning_rate": 0.00010649951008717938, "loss": 0.0612, "step": 76780 }, { "epoch": 1.93, "learning_rate": 0.00010612265407130115, "loss": 0.0629, "step": 76790 }, { "epoch": 1.93, "learning_rate": 0.00010574579805542296, "loss": 0.0595, "step": 76800 }, { "epoch": 1.93, "learning_rate": 0.00010536894203954476, "loss": 0.06, "step": 76810 }, { "epoch": 1.93, "learning_rate": 0.00010499208602366656, "loss": 0.061, "step": 76820 }, { "epoch": 1.93, "learning_rate": 0.00010461523000778837, "loss": 0.0628, "step": 76830 }, { "epoch": 1.93, "learning_rate": 0.00010423837399191017, "loss": 0.0576, "step": 76840 }, { "epoch": 1.93, "learning_rate": 0.00010386151797603195, "loss": 0.0618, "step": 76850 }, { "epoch": 1.93, "learning_rate": 0.00010348466196015375, "loss": 0.065, "step": 76860 }, { "epoch": 1.93, "learning_rate": 0.00010310780594427556, "loss": 0.0574, "step": 76870 }, { "epoch": 1.93, "learning_rate": 0.00010273094992839736, "loss": 0.0611, "step": 76880 }, { "epoch": 1.93, "learning_rate": 0.00010235409391251916, "loss": 0.0585, "step": 76890 }, { "epoch": 1.93, "learning_rate": 0.00010197723789664095, "loss": 0.0577, "step": 76900 }, { "epoch": 1.93, "learning_rate": 0.00010160038188076275, "loss": 0.0619, "step": 76910 }, { "epoch": 1.93, "learning_rate": 0.00010122352586488456, "loss": 0.0609, "step": 76920 }, { "epoch": 1.93, "learning_rate": 0.00010084666984900636, "loss": 0.062, "step": 76930 }, { "epoch": 1.93, "learning_rate": 0.00010046981383312817, "loss": 0.0603, "step": 76940 }, { "epoch": 1.93, "learning_rate": 0.00010009295781724997, "loss": 0.0619, "step": 76950 }, { "epoch": 1.93, "learning_rate": 9.971610180137175e-05, "loss": 0.0619, "step": 76960 }, { "epoch": 1.93, "learning_rate": 9.933924578549355e-05, "loss": 0.0612, "step": 76970 }, { "epoch": 1.93, "learning_rate": 9.896238976961535e-05, "loss": 0.0588, "step": 76980 }, { "epoch": 1.93, "learning_rate": 9.858553375373716e-05, "loss": 0.0613, "step": 76990 }, { "epoch": 1.93, "learning_rate": 9.820867773785896e-05, "loss": 0.06, "step": 77000 }, { "epoch": 1.93, "eval_cer": 0.6651647467982543, "eval_loss": 0.05269329249858856, "eval_runtime": 90.4414, "eval_samples_per_second": 110.558, "eval_steps_per_second": 6.911, "step": 77000 }, { "epoch": 1.93, "learning_rate": 9.783182172198075e-05, "loss": 0.059, "step": 77010 }, { "epoch": 1.93, "learning_rate": 9.745496570610255e-05, "loss": 0.0612, "step": 77020 }, { "epoch": 1.94, "learning_rate": 9.707810969022436e-05, "loss": 0.0594, "step": 77030 }, { "epoch": 1.94, "learning_rate": 9.670125367434616e-05, "loss": 0.0599, "step": 77040 }, { "epoch": 1.94, "learning_rate": 9.632439765846796e-05, "loss": 0.0639, "step": 77050 }, { "epoch": 1.94, "learning_rate": 9.594754164258977e-05, "loss": 0.0599, "step": 77060 }, { "epoch": 1.94, "learning_rate": 9.557068562671155e-05, "loss": 0.0587, "step": 77070 }, { "epoch": 1.94, "learning_rate": 9.519382961083335e-05, "loss": 0.0657, "step": 77080 }, { "epoch": 1.94, "learning_rate": 9.481697359495515e-05, "loss": 0.0587, "step": 77090 }, { "epoch": 1.94, "learning_rate": 9.444011757907696e-05, "loss": 0.0648, "step": 77100 }, { "epoch": 1.94, "learning_rate": 9.406326156319876e-05, "loss": 0.063, "step": 77110 }, { "epoch": 1.94, "learning_rate": 9.368640554732055e-05, "loss": 0.0626, "step": 77120 }, { "epoch": 1.94, "learning_rate": 9.330954953144236e-05, "loss": 0.0587, "step": 77130 }, { "epoch": 1.94, "learning_rate": 9.293269351556415e-05, "loss": 0.0593, "step": 77140 }, { "epoch": 1.94, "learning_rate": 9.255583749968596e-05, "loss": 0.0608, "step": 77150 }, { "epoch": 1.94, "learning_rate": 9.217898148380776e-05, "loss": 0.0601, "step": 77160 }, { "epoch": 1.94, "learning_rate": 9.180212546792956e-05, "loss": 0.0618, "step": 77170 }, { "epoch": 1.94, "learning_rate": 9.142526945205136e-05, "loss": 0.0609, "step": 77180 }, { "epoch": 1.94, "learning_rate": 9.104841343617315e-05, "loss": 0.0617, "step": 77190 }, { "epoch": 1.94, "learning_rate": 9.067155742029495e-05, "loss": 0.0606, "step": 77200 }, { "epoch": 1.94, "learning_rate": 9.029470140441675e-05, "loss": 0.0592, "step": 77210 }, { "epoch": 1.94, "learning_rate": 8.991784538853855e-05, "loss": 0.0589, "step": 77220 }, { "epoch": 1.94, "learning_rate": 8.954098937266035e-05, "loss": 0.0596, "step": 77230 }, { "epoch": 1.94, "learning_rate": 8.916413335678216e-05, "loss": 0.0613, "step": 77240 }, { "epoch": 1.94, "learning_rate": 8.878727734090395e-05, "loss": 0.0617, "step": 77250 }, { "epoch": 1.94, "learning_rate": 8.841042132502576e-05, "loss": 0.0619, "step": 77260 }, { "epoch": 1.94, "learning_rate": 8.803356530914756e-05, "loss": 0.0617, "step": 77270 }, { "epoch": 1.94, "learning_rate": 8.765670929326936e-05, "loss": 0.0625, "step": 77280 }, { "epoch": 1.94, "learning_rate": 8.727985327739116e-05, "loss": 0.059, "step": 77290 }, { "epoch": 1.94, "learning_rate": 8.690299726151296e-05, "loss": 0.0642, "step": 77300 }, { "epoch": 1.94, "learning_rate": 8.652614124563475e-05, "loss": 0.0595, "step": 77310 }, { "epoch": 1.94, "learning_rate": 8.614928522975655e-05, "loss": 0.06, "step": 77320 }, { "epoch": 1.94, "learning_rate": 8.577242921387835e-05, "loss": 0.0631, "step": 77330 }, { "epoch": 1.94, "learning_rate": 8.539557319800015e-05, "loss": 0.0612, "step": 77340 }, { "epoch": 1.94, "learning_rate": 8.501871718212195e-05, "loss": 0.06, "step": 77350 }, { "epoch": 1.94, "learning_rate": 8.464186116624375e-05, "loss": 0.061, "step": 77360 }, { "epoch": 1.94, "learning_rate": 8.426500515036555e-05, "loss": 0.0617, "step": 77370 }, { "epoch": 1.94, "learning_rate": 8.388814913448736e-05, "loss": 0.0589, "step": 77380 }, { "epoch": 1.94, "learning_rate": 8.351129311860914e-05, "loss": 0.0638, "step": 77390 }, { "epoch": 1.94, "learning_rate": 8.313443710273096e-05, "loss": 0.0593, "step": 77400 }, { "epoch": 1.94, "learning_rate": 8.275758108685276e-05, "loss": 0.0609, "step": 77410 }, { "epoch": 1.95, "learning_rate": 8.238072507097455e-05, "loss": 0.0622, "step": 77420 }, { "epoch": 1.95, "learning_rate": 8.200386905509635e-05, "loss": 0.0592, "step": 77430 }, { "epoch": 1.95, "learning_rate": 8.162701303921815e-05, "loss": 0.0613, "step": 77440 }, { "epoch": 1.95, "learning_rate": 8.125015702333995e-05, "loss": 0.0625, "step": 77450 }, { "epoch": 1.95, "learning_rate": 8.087330100746175e-05, "loss": 0.0615, "step": 77460 }, { "epoch": 1.95, "learning_rate": 8.049644499158355e-05, "loss": 0.0609, "step": 77470 }, { "epoch": 1.95, "learning_rate": 8.011958897570535e-05, "loss": 0.0612, "step": 77480 }, { "epoch": 1.95, "learning_rate": 7.974273295982716e-05, "loss": 0.0612, "step": 77490 }, { "epoch": 1.95, "learning_rate": 7.936587694394895e-05, "loss": 0.0627, "step": 77500 }, { "epoch": 1.95, "eval_cer": 0.6651560846522654, "eval_loss": 0.05267711356282234, "eval_runtime": 90.8378, "eval_samples_per_second": 110.075, "eval_steps_per_second": 6.88, "step": 77500 }, { "epoch": 1.95, "learning_rate": 7.898902092807074e-05, "loss": 0.0632, "step": 77510 }, { "epoch": 1.95, "learning_rate": 7.861216491219256e-05, "loss": 0.0586, "step": 77520 }, { "epoch": 1.95, "learning_rate": 7.823530889631434e-05, "loss": 0.0614, "step": 77530 }, { "epoch": 1.95, "learning_rate": 7.785845288043615e-05, "loss": 0.0623, "step": 77540 }, { "epoch": 1.95, "learning_rate": 7.748159686455795e-05, "loss": 0.0626, "step": 77550 }, { "epoch": 1.95, "learning_rate": 7.710474084867975e-05, "loss": 0.0603, "step": 77560 }, { "epoch": 1.95, "learning_rate": 7.672788483280155e-05, "loss": 0.0623, "step": 77570 }, { "epoch": 1.95, "learning_rate": 7.635102881692335e-05, "loss": 0.063, "step": 77580 }, { "epoch": 1.95, "learning_rate": 7.597417280104515e-05, "loss": 0.0625, "step": 77590 }, { "epoch": 1.95, "learning_rate": 7.559731678516695e-05, "loss": 0.0582, "step": 77600 }, { "epoch": 1.95, "learning_rate": 7.522046076928875e-05, "loss": 0.0616, "step": 77610 }, { "epoch": 1.95, "learning_rate": 7.484360475341055e-05, "loss": 0.0619, "step": 77620 }, { "epoch": 1.95, "learning_rate": 7.446674873753236e-05, "loss": 0.0604, "step": 77630 }, { "epoch": 1.95, "learning_rate": 7.408989272165414e-05, "loss": 0.0649, "step": 77640 }, { "epoch": 1.95, "learning_rate": 7.371303670577596e-05, "loss": 0.0632, "step": 77650 }, { "epoch": 1.95, "learning_rate": 7.333618068989775e-05, "loss": 0.06, "step": 77660 }, { "epoch": 1.95, "learning_rate": 7.295932467401954e-05, "loss": 0.059, "step": 77670 }, { "epoch": 1.95, "learning_rate": 7.258246865814135e-05, "loss": 0.0617, "step": 77680 }, { "epoch": 1.95, "learning_rate": 7.220561264226314e-05, "loss": 0.0604, "step": 77690 }, { "epoch": 1.95, "learning_rate": 7.182875662638495e-05, "loss": 0.0627, "step": 77700 }, { "epoch": 1.95, "learning_rate": 7.145190061050675e-05, "loss": 0.0601, "step": 77710 }, { "epoch": 1.95, "learning_rate": 7.107504459462855e-05, "loss": 0.0644, "step": 77720 }, { "epoch": 1.95, "learning_rate": 7.069818857875035e-05, "loss": 0.0596, "step": 77730 }, { "epoch": 1.95, "learning_rate": 7.032133256287214e-05, "loss": 0.0626, "step": 77740 }, { "epoch": 1.95, "learning_rate": 6.994447654699394e-05, "loss": 0.0589, "step": 77750 }, { "epoch": 1.95, "learning_rate": 6.956762053111574e-05, "loss": 0.0616, "step": 77760 }, { "epoch": 1.95, "learning_rate": 6.919076451523755e-05, "loss": 0.062, "step": 77770 }, { "epoch": 1.95, "learning_rate": 6.881390849935934e-05, "loss": 0.0619, "step": 77780 }, { "epoch": 1.95, "learning_rate": 6.843705248348115e-05, "loss": 0.0602, "step": 77790 }, { "epoch": 1.95, "learning_rate": 6.806019646760295e-05, "loss": 0.0604, "step": 77800 }, { "epoch": 1.95, "learning_rate": 6.768334045172475e-05, "loss": 0.0636, "step": 77810 }, { "epoch": 1.96, "learning_rate": 6.730648443584655e-05, "loss": 0.0588, "step": 77820 }, { "epoch": 1.96, "learning_rate": 6.692962841996833e-05, "loss": 0.0653, "step": 77830 }, { "epoch": 1.96, "learning_rate": 6.655277240409015e-05, "loss": 0.0624, "step": 77840 }, { "epoch": 1.96, "learning_rate": 6.617591638821195e-05, "loss": 0.0609, "step": 77850 }, { "epoch": 1.96, "learning_rate": 6.579906037233374e-05, "loss": 0.0611, "step": 77860 }, { "epoch": 1.96, "learning_rate": 6.542220435645554e-05, "loss": 0.0619, "step": 77870 }, { "epoch": 1.96, "learning_rate": 6.504534834057734e-05, "loss": 0.0622, "step": 77880 }, { "epoch": 1.96, "learning_rate": 6.466849232469914e-05, "loss": 0.0595, "step": 77890 }, { "epoch": 1.96, "learning_rate": 6.429163630882094e-05, "loss": 0.0605, "step": 77900 }, { "epoch": 1.96, "learning_rate": 6.391478029294275e-05, "loss": 0.0599, "step": 77910 }, { "epoch": 1.96, "learning_rate": 6.353792427706454e-05, "loss": 0.0602, "step": 77920 }, { "epoch": 1.96, "learning_rate": 6.316106826118635e-05, "loss": 0.0633, "step": 77930 }, { "epoch": 1.96, "learning_rate": 6.278421224530815e-05, "loss": 0.0625, "step": 77940 }, { "epoch": 1.96, "learning_rate": 6.240735622942995e-05, "loss": 0.06, "step": 77950 }, { "epoch": 1.96, "learning_rate": 6.203050021355175e-05, "loss": 0.059, "step": 77960 }, { "epoch": 1.96, "learning_rate": 6.165364419767355e-05, "loss": 0.0586, "step": 77970 }, { "epoch": 1.96, "learning_rate": 6.127678818179534e-05, "loss": 0.0617, "step": 77980 }, { "epoch": 1.96, "learning_rate": 6.089993216591715e-05, "loss": 0.0621, "step": 77990 }, { "epoch": 1.96, "learning_rate": 6.052307615003894e-05, "loss": 0.0607, "step": 78000 }, { "epoch": 1.96, "eval_cer": 0.6651161425346498, "eval_loss": 0.052589353173971176, "eval_runtime": 90.6912, "eval_samples_per_second": 110.253, "eval_steps_per_second": 6.892, "step": 78000 }, { "epoch": 1.96, "learning_rate": 6.014622013416074e-05, "loss": 0.0597, "step": 78010 }, { "epoch": 1.96, "learning_rate": 5.9769364118282546e-05, "loss": 0.0611, "step": 78020 }, { "epoch": 1.96, "learning_rate": 5.939250810240434e-05, "loss": 0.0614, "step": 78030 }, { "epoch": 1.96, "learning_rate": 5.9015652086526144e-05, "loss": 0.062, "step": 78040 }, { "epoch": 1.96, "learning_rate": 5.863879607064795e-05, "loss": 0.0651, "step": 78050 }, { "epoch": 1.96, "learning_rate": 5.826194005476974e-05, "loss": 0.0595, "step": 78060 }, { "epoch": 1.96, "learning_rate": 5.788508403889155e-05, "loss": 0.0611, "step": 78070 }, { "epoch": 1.96, "learning_rate": 5.750822802301334e-05, "loss": 0.063, "step": 78080 }, { "epoch": 1.96, "learning_rate": 5.713137200713514e-05, "loss": 0.0613, "step": 78090 }, { "epoch": 1.96, "learning_rate": 5.6754515991256943e-05, "loss": 0.0603, "step": 78100 }, { "epoch": 1.96, "learning_rate": 5.6377659975378736e-05, "loss": 0.0592, "step": 78110 }, { "epoch": 1.96, "learning_rate": 5.600080395950054e-05, "loss": 0.0621, "step": 78120 }, { "epoch": 1.96, "learning_rate": 5.562394794362235e-05, "loss": 0.0623, "step": 78130 }, { "epoch": 1.96, "learning_rate": 5.524709192774414e-05, "loss": 0.06, "step": 78140 }, { "epoch": 1.96, "learning_rate": 5.4870235911865944e-05, "loss": 0.0623, "step": 78150 }, { "epoch": 1.96, "learning_rate": 5.449337989598774e-05, "loss": 0.0603, "step": 78160 }, { "epoch": 1.96, "learning_rate": 5.4116523880109535e-05, "loss": 0.0575, "step": 78170 }, { "epoch": 1.96, "learning_rate": 5.373966786423134e-05, "loss": 0.0605, "step": 78180 }, { "epoch": 1.96, "learning_rate": 5.3362811848353147e-05, "loss": 0.0585, "step": 78190 }, { "epoch": 1.96, "learning_rate": 5.298595583247494e-05, "loss": 0.0596, "step": 78200 }, { "epoch": 1.96, "learning_rate": 5.2609099816596744e-05, "loss": 0.0609, "step": 78210 }, { "epoch": 1.97, "learning_rate": 5.2232243800718536e-05, "loss": 0.0582, "step": 78220 }, { "epoch": 1.97, "learning_rate": 5.185538778484034e-05, "loss": 0.0607, "step": 78230 }, { "epoch": 1.97, "learning_rate": 5.147853176896214e-05, "loss": 0.0582, "step": 78240 }, { "epoch": 1.97, "learning_rate": 5.110167575308393e-05, "loss": 0.0598, "step": 78250 }, { "epoch": 1.97, "learning_rate": 5.072481973720574e-05, "loss": 0.0581, "step": 78260 }, { "epoch": 1.97, "learning_rate": 5.0347963721327544e-05, "loss": 0.0578, "step": 78270 }, { "epoch": 1.97, "learning_rate": 4.9971107705449336e-05, "loss": 0.0608, "step": 78280 }, { "epoch": 1.97, "learning_rate": 4.959425168957114e-05, "loss": 0.0587, "step": 78290 }, { "epoch": 1.97, "learning_rate": 4.921739567369294e-05, "loss": 0.0607, "step": 78300 }, { "epoch": 1.97, "learning_rate": 4.884053965781474e-05, "loss": 0.0617, "step": 78310 }, { "epoch": 1.97, "learning_rate": 4.846368364193654e-05, "loss": 0.0616, "step": 78320 }, { "epoch": 1.97, "learning_rate": 4.808682762605833e-05, "loss": 0.0586, "step": 78330 }, { "epoch": 1.97, "learning_rate": 4.7709971610180136e-05, "loss": 0.0585, "step": 78340 }, { "epoch": 1.97, "learning_rate": 4.733311559430194e-05, "loss": 0.0597, "step": 78350 }, { "epoch": 1.97, "learning_rate": 4.6956259578423734e-05, "loss": 0.0604, "step": 78360 }, { "epoch": 1.97, "learning_rate": 4.657940356254554e-05, "loss": 0.0638, "step": 78370 }, { "epoch": 1.97, "learning_rate": 4.620254754666734e-05, "loss": 0.0605, "step": 78380 }, { "epoch": 1.97, "learning_rate": 4.582569153078914e-05, "loss": 0.0664, "step": 78390 }, { "epoch": 1.97, "learning_rate": 4.5448835514910936e-05, "loss": 0.0597, "step": 78400 }, { "epoch": 1.97, "learning_rate": 4.5071979499032734e-05, "loss": 0.061, "step": 78410 }, { "epoch": 1.97, "learning_rate": 4.469512348315453e-05, "loss": 0.0616, "step": 78420 }, { "epoch": 1.97, "learning_rate": 4.431826746727634e-05, "loss": 0.0611, "step": 78430 }, { "epoch": 1.97, "learning_rate": 4.394141145139814e-05, "loss": 0.0631, "step": 78440 }, { "epoch": 1.97, "learning_rate": 4.3564555435519937e-05, "loss": 0.0592, "step": 78450 }, { "epoch": 1.97, "learning_rate": 4.3187699419641735e-05, "loss": 0.0617, "step": 78460 }, { "epoch": 1.97, "learning_rate": 4.2810843403763534e-05, "loss": 0.0619, "step": 78470 }, { "epoch": 1.97, "learning_rate": 4.243398738788533e-05, "loss": 0.0592, "step": 78480 }, { "epoch": 1.97, "learning_rate": 4.205713137200713e-05, "loss": 0.0607, "step": 78490 }, { "epoch": 1.97, "learning_rate": 4.168027535612894e-05, "loss": 0.0607, "step": 78500 }, { "epoch": 1.97, "eval_cer": 0.6651493474276073, "eval_loss": 0.052500005811452866, "eval_runtime": 91.3787, "eval_samples_per_second": 109.424, "eval_steps_per_second": 6.84, "step": 78500 }, { "epoch": 1.97, "learning_rate": 4.1303419340250736e-05, "loss": 0.0597, "step": 78510 }, { "epoch": 1.97, "learning_rate": 4.0926563324372535e-05, "loss": 0.061, "step": 78520 }, { "epoch": 1.97, "learning_rate": 4.054970730849434e-05, "loss": 0.0643, "step": 78530 }, { "epoch": 1.97, "learning_rate": 4.017285129261613e-05, "loss": 0.0577, "step": 78540 }, { "epoch": 1.97, "learning_rate": 3.979599527673793e-05, "loss": 0.06, "step": 78550 }, { "epoch": 1.97, "learning_rate": 3.941913926085973e-05, "loss": 0.0619, "step": 78560 }, { "epoch": 1.97, "learning_rate": 3.9042283244981536e-05, "loss": 0.0619, "step": 78570 }, { "epoch": 1.97, "learning_rate": 3.8665427229103335e-05, "loss": 0.0575, "step": 78580 }, { "epoch": 1.97, "learning_rate": 3.8288571213225134e-05, "loss": 0.0604, "step": 78590 }, { "epoch": 1.97, "learning_rate": 3.791171519734694e-05, "loss": 0.0616, "step": 78600 }, { "epoch": 1.97, "learning_rate": 3.753485918146874e-05, "loss": 0.0618, "step": 78610 }, { "epoch": 1.98, "learning_rate": 3.715800316559053e-05, "loss": 0.0605, "step": 78620 }, { "epoch": 1.98, "learning_rate": 3.678114714971233e-05, "loss": 0.059, "step": 78630 }, { "epoch": 1.98, "learning_rate": 3.6404291133834135e-05, "loss": 0.0624, "step": 78640 }, { "epoch": 1.98, "learning_rate": 3.6027435117955934e-05, "loss": 0.0597, "step": 78650 }, { "epoch": 1.98, "learning_rate": 3.565057910207773e-05, "loss": 0.0596, "step": 78660 }, { "epoch": 1.98, "learning_rate": 3.527372308619954e-05, "loss": 0.0583, "step": 78670 }, { "epoch": 1.98, "learning_rate": 3.489686707032134e-05, "loss": 0.0632, "step": 78680 }, { "epoch": 1.98, "learning_rate": 3.4520011054443136e-05, "loss": 0.0659, "step": 78690 }, { "epoch": 1.98, "learning_rate": 3.414315503856493e-05, "loss": 0.0619, "step": 78700 }, { "epoch": 1.98, "learning_rate": 3.3766299022686733e-05, "loss": 0.0598, "step": 78710 }, { "epoch": 1.98, "learning_rate": 3.338944300680853e-05, "loss": 0.0597, "step": 78720 }, { "epoch": 1.98, "learning_rate": 3.301258699093033e-05, "loss": 0.06, "step": 78730 }, { "epoch": 1.98, "learning_rate": 3.263573097505213e-05, "loss": 0.0583, "step": 78740 }, { "epoch": 1.98, "learning_rate": 3.2258874959173936e-05, "loss": 0.0622, "step": 78750 }, { "epoch": 1.98, "learning_rate": 3.1882018943295734e-05, "loss": 0.0592, "step": 78760 }, { "epoch": 1.98, "learning_rate": 3.150516292741753e-05, "loss": 0.0594, "step": 78770 }, { "epoch": 1.98, "learning_rate": 3.112830691153933e-05, "loss": 0.0605, "step": 78780 }, { "epoch": 1.98, "learning_rate": 3.075145089566113e-05, "loss": 0.0601, "step": 78790 }, { "epoch": 1.98, "learning_rate": 3.037459487978293e-05, "loss": 0.0599, "step": 78800 }, { "epoch": 1.98, "learning_rate": 2.999773886390473e-05, "loss": 0.0599, "step": 78810 }, { "epoch": 1.98, "learning_rate": 2.9620882848026534e-05, "loss": 0.0627, "step": 78820 }, { "epoch": 1.98, "learning_rate": 2.924402683214833e-05, "loss": 0.0586, "step": 78830 }, { "epoch": 1.98, "learning_rate": 2.886717081627013e-05, "loss": 0.0597, "step": 78840 }, { "epoch": 1.98, "learning_rate": 2.8490314800391934e-05, "loss": 0.0602, "step": 78850 }, { "epoch": 1.98, "learning_rate": 2.8113458784513733e-05, "loss": 0.0621, "step": 78860 }, { "epoch": 1.98, "learning_rate": 2.773660276863553e-05, "loss": 0.0617, "step": 78870 }, { "epoch": 1.98, "learning_rate": 2.7359746752757327e-05, "loss": 0.0595, "step": 78880 }, { "epoch": 1.98, "learning_rate": 2.6982890736879133e-05, "loss": 0.0631, "step": 78890 }, { "epoch": 1.98, "learning_rate": 2.660603472100093e-05, "loss": 0.0568, "step": 78900 }, { "epoch": 1.98, "learning_rate": 2.6229178705122727e-05, "loss": 0.0623, "step": 78910 }, { "epoch": 1.98, "learning_rate": 2.5852322689244533e-05, "loss": 0.0615, "step": 78920 }, { "epoch": 1.98, "learning_rate": 2.547546667336633e-05, "loss": 0.0599, "step": 78930 }, { "epoch": 1.98, "learning_rate": 2.509861065748813e-05, "loss": 0.0592, "step": 78940 }, { "epoch": 1.98, "learning_rate": 2.4721754641609926e-05, "loss": 0.0628, "step": 78950 }, { "epoch": 1.98, "learning_rate": 2.434489862573173e-05, "loss": 0.0603, "step": 78960 }, { "epoch": 1.98, "learning_rate": 2.396804260985353e-05, "loss": 0.0597, "step": 78970 }, { "epoch": 1.98, "learning_rate": 2.359118659397533e-05, "loss": 0.0591, "step": 78980 }, { "epoch": 1.98, "learning_rate": 2.3214330578097128e-05, "loss": 0.0617, "step": 78990 }, { "epoch": 1.98, "learning_rate": 2.283747456221893e-05, "loss": 0.0608, "step": 79000 }, { "epoch": 1.98, "eval_cer": 0.6651329855962949, "eval_loss": 0.0524982325732708, "eval_runtime": 90.4461, "eval_samples_per_second": 110.552, "eval_steps_per_second": 6.91, "step": 79000 }, { "epoch": 1.98, "learning_rate": 2.246061854634073e-05, "loss": 0.0608, "step": 79010 }, { "epoch": 1.99, "learning_rate": 2.2083762530462528e-05, "loss": 0.0595, "step": 79020 }, { "epoch": 1.99, "learning_rate": 2.1706906514584327e-05, "loss": 0.0613, "step": 79030 }, { "epoch": 1.99, "learning_rate": 2.133005049870613e-05, "loss": 0.0617, "step": 79040 }, { "epoch": 1.99, "learning_rate": 2.0953194482827928e-05, "loss": 0.0616, "step": 79050 }, { "epoch": 1.99, "learning_rate": 2.0576338466949727e-05, "loss": 0.0573, "step": 79060 }, { "epoch": 1.99, "learning_rate": 2.0199482451071525e-05, "loss": 0.0622, "step": 79070 }, { "epoch": 1.99, "learning_rate": 1.9822626435193328e-05, "loss": 0.0612, "step": 79080 }, { "epoch": 1.99, "learning_rate": 1.944577041931513e-05, "loss": 0.0601, "step": 79090 }, { "epoch": 1.99, "learning_rate": 1.9068914403436925e-05, "loss": 0.0604, "step": 79100 }, { "epoch": 1.99, "learning_rate": 1.8692058387558728e-05, "loss": 0.0615, "step": 79110 }, { "epoch": 1.99, "learning_rate": 1.8315202371680526e-05, "loss": 0.062, "step": 79120 }, { "epoch": 1.99, "learning_rate": 1.793834635580233e-05, "loss": 0.0617, "step": 79130 }, { "epoch": 1.99, "learning_rate": 1.7561490339924124e-05, "loss": 0.0614, "step": 79140 }, { "epoch": 1.99, "learning_rate": 1.7184634324045926e-05, "loss": 0.0594, "step": 79150 }, { "epoch": 1.99, "learning_rate": 1.680777830816773e-05, "loss": 0.0623, "step": 79160 }, { "epoch": 1.99, "learning_rate": 1.6430922292289527e-05, "loss": 0.057, "step": 79170 }, { "epoch": 1.99, "learning_rate": 1.6054066276411326e-05, "loss": 0.061, "step": 79180 }, { "epoch": 1.99, "learning_rate": 1.5677210260533125e-05, "loss": 0.0611, "step": 79190 }, { "epoch": 1.99, "learning_rate": 1.5300354244654927e-05, "loss": 0.0583, "step": 79200 }, { "epoch": 1.99, "learning_rate": 1.4923498228776724e-05, "loss": 0.0612, "step": 79210 }, { "epoch": 1.99, "learning_rate": 1.4546642212898525e-05, "loss": 0.0616, "step": 79220 }, { "epoch": 1.99, "learning_rate": 1.4169786197020324e-05, "loss": 0.0598, "step": 79230 }, { "epoch": 1.99, "learning_rate": 1.3792930181142124e-05, "loss": 0.0588, "step": 79240 }, { "epoch": 1.99, "learning_rate": 1.3416074165263927e-05, "loss": 0.059, "step": 79250 }, { "epoch": 1.99, "learning_rate": 1.3039218149385725e-05, "loss": 0.0625, "step": 79260 }, { "epoch": 1.99, "learning_rate": 1.2662362133507526e-05, "loss": 0.0611, "step": 79270 }, { "epoch": 1.99, "learning_rate": 1.2285506117629325e-05, "loss": 0.0597, "step": 79280 }, { "epoch": 1.99, "learning_rate": 1.1908650101751125e-05, "loss": 0.0572, "step": 79290 }, { "epoch": 1.99, "learning_rate": 1.1531794085872924e-05, "loss": 0.0631, "step": 79300 }, { "epoch": 1.99, "learning_rate": 1.1154938069994725e-05, "loss": 0.0641, "step": 79310 }, { "epoch": 1.99, "learning_rate": 1.0778082054116523e-05, "loss": 0.0587, "step": 79320 }, { "epoch": 1.99, "learning_rate": 1.0401226038238324e-05, "loss": 0.0644, "step": 79330 }, { "epoch": 1.99, "learning_rate": 1.0024370022360123e-05, "loss": 0.0589, "step": 79340 }, { "epoch": 1.99, "learning_rate": 9.647514006481923e-06, "loss": 0.0602, "step": 79350 }, { "epoch": 1.99, "learning_rate": 9.270657990603724e-06, "loss": 0.0591, "step": 79360 }, { "epoch": 1.99, "learning_rate": 8.893801974725524e-06, "loss": 0.0617, "step": 79370 }, { "epoch": 1.99, "learning_rate": 8.516945958847323e-06, "loss": 0.0602, "step": 79380 }, { "epoch": 1.99, "learning_rate": 8.140089942969124e-06, "loss": 0.0613, "step": 79390 }, { "epoch": 1.99, "learning_rate": 7.763233927090923e-06, "loss": 0.0571, "step": 79400 }, { "epoch": 2.0, "learning_rate": 7.386377911212722e-06, "loss": 0.0634, "step": 79410 }, { "epoch": 2.0, "learning_rate": 7.009521895334522e-06, "loss": 0.062, "step": 79420 }, { "epoch": 2.0, "learning_rate": 6.632665879456322e-06, "loss": 0.0641, "step": 79430 }, { "epoch": 2.0, "learning_rate": 6.255809863578123e-06, "loss": 0.0608, "step": 79440 }, { "epoch": 2.0, "learning_rate": 5.878953847699923e-06, "loss": 0.0603, "step": 79450 }, { "epoch": 2.0, "learning_rate": 5.502097831821722e-06, "loss": 0.0619, "step": 79460 }, { "epoch": 2.0, "learning_rate": 5.125241815943522e-06, "loss": 0.0595, "step": 79470 }, { "epoch": 2.0, "learning_rate": 4.748385800065322e-06, "loss": 0.0601, "step": 79480 }, { "epoch": 2.0, "learning_rate": 4.3715297841871215e-06, "loss": 0.0571, "step": 79490 }, { "epoch": 2.0, "learning_rate": 3.994673768308922e-06, "loss": 0.0609, "step": 79500 }, { "epoch": 2.0, "eval_cer": 0.665112292691988, "eval_loss": 0.0524970106780529, "eval_runtime": 90.3409, "eval_samples_per_second": 110.681, "eval_steps_per_second": 6.918, "step": 79500 }, { "epoch": 2.0, "learning_rate": 3.6178177524307217e-06, "loss": 0.0622, "step": 79510 }, { "epoch": 2.0, "learning_rate": 3.2409617365525214e-06, "loss": 0.0615, "step": 79520 }, { "epoch": 2.0, "learning_rate": 2.864105720674321e-06, "loss": 0.0603, "step": 79530 }, { "epoch": 2.0, "learning_rate": 2.4872497047961207e-06, "loss": 0.0585, "step": 79540 }, { "epoch": 2.0, "learning_rate": 2.110393688917921e-06, "loss": 0.0578, "step": 79550 }, { "epoch": 2.0, "learning_rate": 1.7335376730397205e-06, "loss": 0.0584, "step": 79560 }, { "epoch": 2.0, "learning_rate": 1.3566816571615204e-06, "loss": 0.0625, "step": 79570 }, { "epoch": 2.0, "learning_rate": 9.798256412833203e-07, "loss": 0.0624, "step": 79580 }, { "epoch": 2.0, "learning_rate": 6.029696254051202e-07, "loss": 0.0634, "step": 79590 }, { "epoch": 2.0, "learning_rate": 2.261136095269201e-07, "loss": 0.0606, "step": 79600 }, { "epoch": 2.0, "step": 79606, "total_flos": 3.941634629940987e+18, "train_loss": 0.1818607694105572, "train_runtime": 106697.7235, "train_samples_per_second": 191.002, "train_steps_per_second": 0.746 } ], "max_steps": 79606, "num_train_epochs": 2, "total_flos": 3.941634629940987e+18, "trial_name": null, "trial_params": null }