diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,8 +1,8 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 12.773065150852645, - "global_step": 14600, + "epoch": 24.146917358985572, + "global_step": 27600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -9060,11 +9060,8075 @@ "learning_rate": 0.00020691489361702125, "loss": 0.9234, "step": 14600 + }, + { + "epoch": 12.78, + "learning_rate": 0.00020684840425531912, + "loss": 0.848, + "step": 14610 + }, + { + "epoch": 12.79, + "learning_rate": 0.00020678191489361699, + "loss": 0.8915, + "step": 14620 + }, + { + "epoch": 12.8, + "learning_rate": 0.00020671542553191486, + "loss": 0.9263, + "step": 14630 + }, + { + "epoch": 12.81, + "learning_rate": 0.00020664893617021275, + "loss": 0.7667, + "step": 14640 + }, + { + "epoch": 12.82, + "learning_rate": 0.00020658244680851062, + "loss": 0.9482, + "step": 14650 + }, + { + "epoch": 12.83, + "learning_rate": 0.0002065159574468085, + "loss": 0.9315, + "step": 14660 + }, + { + "epoch": 12.83, + "learning_rate": 0.00020644946808510636, + "loss": 0.8704, + "step": 14670 + }, + { + "epoch": 12.84, + "learning_rate": 0.00020638297872340423, + "loss": 0.905, + "step": 14680 + }, + { + "epoch": 12.85, + "learning_rate": 0.0002063164893617021, + "loss": 1.0015, + "step": 14690 + }, + { + "epoch": 12.86, + "learning_rate": 0.00020624999999999997, + "loss": 1.0181, + "step": 14700 + }, + { + "epoch": 12.87, + "learning_rate": 0.00020618351063829787, + "loss": 0.8935, + "step": 14710 + }, + { + "epoch": 12.88, + "learning_rate": 0.00020611702127659574, + "loss": 1.0126, + "step": 14720 + }, + { + "epoch": 12.89, + "learning_rate": 0.0002060505319148936, + "loss": 1.0019, + "step": 14730 + }, + { + "epoch": 12.9, + "learning_rate": 0.00020598404255319148, + "loss": 0.929, + "step": 14740 + }, + { + "epoch": 12.9, + "learning_rate": 0.00020591755319148935, + "loss": 0.9538, + "step": 14750 + }, + { + "epoch": 12.91, + "learning_rate": 0.00020585106382978722, + "loss": 0.997, + "step": 14760 + }, + { + "epoch": 12.92, + "learning_rate": 0.0002057845744680851, + "loss": 0.9999, + "step": 14770 + }, + { + "epoch": 12.93, + "learning_rate": 0.00020571808510638296, + "loss": 0.8423, + "step": 14780 + }, + { + "epoch": 12.94, + "learning_rate": 0.00020565159574468085, + "loss": 0.878, + "step": 14790 + }, + { + "epoch": 12.95, + "learning_rate": 0.00020558510638297872, + "loss": 0.9586, + "step": 14800 + }, + { + "epoch": 12.96, + "learning_rate": 0.0002055186170212766, + "loss": 0.8543, + "step": 14810 + }, + { + "epoch": 12.97, + "learning_rate": 0.00020545212765957446, + "loss": 0.8633, + "step": 14820 + }, + { + "epoch": 12.97, + "learning_rate": 0.00020538563829787233, + "loss": 0.9061, + "step": 14830 + }, + { + "epoch": 12.98, + "learning_rate": 0.0002053191489361702, + "loss": 0.7897, + "step": 14840 + }, + { + "epoch": 12.99, + "learning_rate": 0.00020525265957446807, + "loss": 0.9661, + "step": 14850 + }, + { + "epoch": 13.0, + "learning_rate": 0.00020518617021276594, + "loss": 0.9375, + "step": 14860 + }, + { + "epoch": 13.01, + "learning_rate": 0.00020511968085106384, + "loss": 0.9073, + "step": 14870 + }, + { + "epoch": 13.02, + "learning_rate": 0.00020505319148936166, + "loss": 0.7484, + "step": 14880 + }, + { + "epoch": 13.03, + "learning_rate": 0.00020498670212765955, + "loss": 0.8098, + "step": 14890 + }, + { + "epoch": 13.04, + "learning_rate": 0.00020492021276595742, + "loss": 0.8629, + "step": 14900 + }, + { + "epoch": 13.04, + "learning_rate": 0.0002048537234042553, + "loss": 0.7741, + "step": 14910 + }, + { + "epoch": 13.05, + "learning_rate": 0.00020478723404255316, + "loss": 0.9069, + "step": 14920 + }, + { + "epoch": 13.06, + "learning_rate": 0.00020472074468085103, + "loss": 0.7353, + "step": 14930 + }, + { + "epoch": 13.07, + "learning_rate": 0.0002046542553191489, + "loss": 0.8632, + "step": 14940 + }, + { + "epoch": 13.08, + "learning_rate": 0.00020458776595744677, + "loss": 0.7818, + "step": 14950 + }, + { + "epoch": 13.09, + "learning_rate": 0.00020452127659574464, + "loss": 0.7384, + "step": 14960 + }, + { + "epoch": 13.1, + "learning_rate": 0.00020445478723404254, + "loss": 0.894, + "step": 14970 + }, + { + "epoch": 13.11, + "learning_rate": 0.0002043882978723404, + "loss": 0.8132, + "step": 14980 + }, + { + "epoch": 13.11, + "learning_rate": 0.00020432180851063828, + "loss": 0.8529, + "step": 14990 + }, + { + "epoch": 13.12, + "learning_rate": 0.00020425531914893615, + "loss": 0.8909, + "step": 15000 + }, + { + "epoch": 13.12, + "eval_cer1": 0.3392187974747645, + "eval_cer2": 0.3177686628383921, + "eval_cer3": 0.2885331590983339, + "eval_cer4": 0.29511574744840463, + "eval_cer5": 0.3207643312101911, + "eval_loss": 1.1855053901672363, + "eval_runtime": 1264.3288, + "eval_samples_per_second": 6.929, + "step": 15000 + }, + { + "epoch": 13.13, + "learning_rate": 0.00020418882978723402, + "loss": 0.7726, + "step": 15010 + }, + { + "epoch": 13.14, + "learning_rate": 0.0002041223404255319, + "loss": 0.8991, + "step": 15020 + }, + { + "epoch": 13.15, + "learning_rate": 0.00020405585106382976, + "loss": 0.8376, + "step": 15030 + }, + { + "epoch": 13.16, + "learning_rate": 0.00020398936170212763, + "loss": 0.9154, + "step": 15040 + }, + { + "epoch": 13.17, + "learning_rate": 0.00020392287234042553, + "loss": 0.7976, + "step": 15050 + }, + { + "epoch": 13.18, + "learning_rate": 0.0002038563829787234, + "loss": 0.697, + "step": 15060 + }, + { + "epoch": 13.18, + "learning_rate": 0.00020378989361702126, + "loss": 0.8543, + "step": 15070 + }, + { + "epoch": 13.19, + "learning_rate": 0.00020372340425531913, + "loss": 0.7901, + "step": 15080 + }, + { + "epoch": 13.2, + "learning_rate": 0.000203656914893617, + "loss": 0.8668, + "step": 15090 + }, + { + "epoch": 13.21, + "learning_rate": 0.00020359042553191487, + "loss": 0.8611, + "step": 15100 + }, + { + "epoch": 13.22, + "learning_rate": 0.00020352393617021274, + "loss": 0.7238, + "step": 15110 + }, + { + "epoch": 13.23, + "learning_rate": 0.00020345744680851061, + "loss": 0.9031, + "step": 15120 + }, + { + "epoch": 13.24, + "learning_rate": 0.0002033909574468085, + "loss": 0.7859, + "step": 15130 + }, + { + "epoch": 13.25, + "learning_rate": 0.00020332446808510638, + "loss": 0.8138, + "step": 15140 + }, + { + "epoch": 13.25, + "learning_rate": 0.00020325797872340425, + "loss": 0.764, + "step": 15150 + }, + { + "epoch": 13.26, + "learning_rate": 0.00020319148936170212, + "loss": 0.7924, + "step": 15160 + }, + { + "epoch": 13.27, + "learning_rate": 0.000203125, + "loss": 0.914, + "step": 15170 + }, + { + "epoch": 13.28, + "learning_rate": 0.00020305851063829786, + "loss": 0.8773, + "step": 15180 + }, + { + "epoch": 13.29, + "learning_rate": 0.00020299202127659573, + "loss": 0.804, + "step": 15190 + }, + { + "epoch": 13.3, + "learning_rate": 0.0002029255319148936, + "loss": 0.8032, + "step": 15200 + }, + { + "epoch": 13.31, + "learning_rate": 0.0002028590425531915, + "loss": 0.7001, + "step": 15210 + }, + { + "epoch": 13.32, + "learning_rate": 0.00020279255319148937, + "loss": 0.8891, + "step": 15220 + }, + { + "epoch": 13.32, + "learning_rate": 0.0002027260638297872, + "loss": 0.8022, + "step": 15230 + }, + { + "epoch": 13.33, + "learning_rate": 0.00020265957446808508, + "loss": 0.8473, + "step": 15240 + }, + { + "epoch": 13.34, + "learning_rate": 0.00020259308510638295, + "loss": 0.8071, + "step": 15250 + }, + { + "epoch": 13.35, + "learning_rate": 0.00020252659574468082, + "loss": 0.7937, + "step": 15260 + }, + { + "epoch": 13.36, + "learning_rate": 0.0002024601063829787, + "loss": 0.8766, + "step": 15270 + }, + { + "epoch": 13.37, + "learning_rate": 0.00020239361702127656, + "loss": 0.7101, + "step": 15280 + }, + { + "epoch": 13.38, + "learning_rate": 0.00020232712765957443, + "loss": 0.8392, + "step": 15290 + }, + { + "epoch": 13.39, + "learning_rate": 0.00020226063829787233, + "loss": 0.8145, + "step": 15300 + }, + { + "epoch": 13.39, + "learning_rate": 0.0002021941489361702, + "loss": 0.7219, + "step": 15310 + }, + { + "epoch": 13.4, + "learning_rate": 0.00020212765957446807, + "loss": 0.8866, + "step": 15320 + }, + { + "epoch": 13.41, + "learning_rate": 0.00020206117021276594, + "loss": 0.8459, + "step": 15330 + }, + { + "epoch": 13.42, + "learning_rate": 0.0002019946808510638, + "loss": 0.8178, + "step": 15340 + }, + { + "epoch": 13.43, + "learning_rate": 0.00020192819148936168, + "loss": 0.893, + "step": 15350 + }, + { + "epoch": 13.44, + "learning_rate": 0.00020186170212765955, + "loss": 0.7521, + "step": 15360 + }, + { + "epoch": 13.45, + "learning_rate": 0.00020179521276595741, + "loss": 0.9168, + "step": 15370 + }, + { + "epoch": 13.46, + "learning_rate": 0.0002017287234042553, + "loss": 0.7176, + "step": 15380 + }, + { + "epoch": 13.46, + "learning_rate": 0.00020166223404255318, + "loss": 0.7773, + "step": 15390 + }, + { + "epoch": 13.47, + "learning_rate": 0.00020159574468085105, + "loss": 0.7758, + "step": 15400 + }, + { + "epoch": 13.48, + "learning_rate": 0.00020152925531914892, + "loss": 0.754, + "step": 15410 + }, + { + "epoch": 13.49, + "learning_rate": 0.0002014627659574468, + "loss": 0.8364, + "step": 15420 + }, + { + "epoch": 13.5, + "learning_rate": 0.00020139627659574466, + "loss": 0.6987, + "step": 15430 + }, + { + "epoch": 13.51, + "learning_rate": 0.00020132978723404253, + "loss": 0.8569, + "step": 15440 + }, + { + "epoch": 13.52, + "learning_rate": 0.0002012632978723404, + "loss": 0.8074, + "step": 15450 + }, + { + "epoch": 13.53, + "learning_rate": 0.0002011968085106383, + "loss": 0.6713, + "step": 15460 + }, + { + "epoch": 13.53, + "learning_rate": 0.00020113031914893617, + "loss": 0.9293, + "step": 15470 + }, + { + "epoch": 13.54, + "learning_rate": 0.00020106382978723404, + "loss": 0.6779, + "step": 15480 + }, + { + "epoch": 13.55, + "learning_rate": 0.0002009973404255319, + "loss": 0.8982, + "step": 15490 + }, + { + "epoch": 13.56, + "learning_rate": 0.00020093085106382978, + "loss": 0.8553, + "step": 15500 + }, + { + "epoch": 13.57, + "learning_rate": 0.00020086436170212765, + "loss": 0.7382, + "step": 15510 + }, + { + "epoch": 13.58, + "learning_rate": 0.00020079787234042552, + "loss": 0.8824, + "step": 15520 + }, + { + "epoch": 13.59, + "learning_rate": 0.0002007313829787234, + "loss": 0.7786, + "step": 15530 + }, + { + "epoch": 13.6, + "learning_rate": 0.00020066489361702128, + "loss": 0.8754, + "step": 15540 + }, + { + "epoch": 13.6, + "learning_rate": 0.00020059840425531915, + "loss": 0.7902, + "step": 15550 + }, + { + "epoch": 13.61, + "learning_rate": 0.00020053191489361702, + "loss": 0.8549, + "step": 15560 + }, + { + "epoch": 13.62, + "learning_rate": 0.0002004654255319149, + "loss": 0.8945, + "step": 15570 + }, + { + "epoch": 13.63, + "learning_rate": 0.00020039893617021276, + "loss": 0.8195, + "step": 15580 + }, + { + "epoch": 13.64, + "learning_rate": 0.0002003324468085106, + "loss": 0.8038, + "step": 15590 + }, + { + "epoch": 13.65, + "learning_rate": 0.00020026595744680848, + "loss": 0.8458, + "step": 15600 + }, + { + "epoch": 13.65, + "eval_cer1": 0.318051382465143, + "eval_cer2": 0.29739130434782607, + "eval_cer3": 0.2697157791571382, + "eval_cer4": 0.2732219324511414, + "eval_cer5": 0.3000424628450106, + "eval_loss": 1.1297023296356201, + "eval_runtime": 1291.5515, + "eval_samples_per_second": 6.783, + "step": 15600 + }, + { + "epoch": 13.66, + "learning_rate": 0.00020019946808510635, + "loss": 0.7666, + "step": 15610 + }, + { + "epoch": 13.67, + "learning_rate": 0.00020013297872340422, + "loss": 0.9345, + "step": 15620 + }, + { + "epoch": 13.67, + "learning_rate": 0.00020006648936170209, + "loss": 0.8501, + "step": 15630 + }, + { + "epoch": 13.68, + "learning_rate": 0.00019999999999999998, + "loss": 0.9028, + "step": 15640 + }, + { + "epoch": 13.69, + "learning_rate": 0.00019993351063829785, + "loss": 0.8467, + "step": 15650 + }, + { + "epoch": 13.7, + "learning_rate": 0.00019986702127659572, + "loss": 0.783, + "step": 15660 + }, + { + "epoch": 13.71, + "learning_rate": 0.0001998005319148936, + "loss": 0.9343, + "step": 15670 + }, + { + "epoch": 13.72, + "learning_rate": 0.00019973404255319146, + "loss": 0.7176, + "step": 15680 + }, + { + "epoch": 13.73, + "learning_rate": 0.00019966755319148933, + "loss": 0.8045, + "step": 15690 + }, + { + "epoch": 13.74, + "learning_rate": 0.0001996010638297872, + "loss": 0.9697, + "step": 15700 + }, + { + "epoch": 13.74, + "learning_rate": 0.00019953457446808507, + "loss": 0.7678, + "step": 15710 + }, + { + "epoch": 13.75, + "learning_rate": 0.00019946808510638297, + "loss": 0.9675, + "step": 15720 + }, + { + "epoch": 13.76, + "learning_rate": 0.00019940159574468084, + "loss": 0.8577, + "step": 15730 + }, + { + "epoch": 13.77, + "learning_rate": 0.0001993351063829787, + "loss": 0.8539, + "step": 15740 + }, + { + "epoch": 13.78, + "learning_rate": 0.00019926861702127658, + "loss": 0.8309, + "step": 15750 + }, + { + "epoch": 13.79, + "learning_rate": 0.00019920212765957445, + "loss": 0.7003, + "step": 15760 + }, + { + "epoch": 13.8, + "learning_rate": 0.00019913563829787232, + "loss": 0.8837, + "step": 15770 + }, + { + "epoch": 13.81, + "learning_rate": 0.0001990691489361702, + "loss": 0.7662, + "step": 15780 + }, + { + "epoch": 13.81, + "learning_rate": 0.00019900265957446806, + "loss": 0.8567, + "step": 15790 + }, + { + "epoch": 13.82, + "learning_rate": 0.00019893617021276595, + "loss": 0.7708, + "step": 15800 + }, + { + "epoch": 13.83, + "learning_rate": 0.00019886968085106382, + "loss": 0.7494, + "step": 15810 + }, + { + "epoch": 13.84, + "learning_rate": 0.0001988031914893617, + "loss": 0.9774, + "step": 15820 + }, + { + "epoch": 13.85, + "learning_rate": 0.00019873670212765956, + "loss": 0.8775, + "step": 15830 + }, + { + "epoch": 13.86, + "learning_rate": 0.00019867021276595743, + "loss": 0.8533, + "step": 15840 + }, + { + "epoch": 13.87, + "learning_rate": 0.0001986037234042553, + "loss": 0.8854, + "step": 15850 + }, + { + "epoch": 13.88, + "learning_rate": 0.00019853723404255317, + "loss": 0.7294, + "step": 15860 + }, + { + "epoch": 13.88, + "learning_rate": 0.00019847074468085107, + "loss": 1.0049, + "step": 15870 + }, + { + "epoch": 13.89, + "learning_rate": 0.00019840425531914894, + "loss": 0.7182, + "step": 15880 + }, + { + "epoch": 13.9, + "learning_rate": 0.0001983377659574468, + "loss": 0.8756, + "step": 15890 + }, + { + "epoch": 13.91, + "learning_rate": 0.00019827127659574468, + "loss": 0.8781, + "step": 15900 + }, + { + "epoch": 13.92, + "learning_rate": 0.00019820478723404255, + "loss": 0.7262, + "step": 15910 + }, + { + "epoch": 13.93, + "learning_rate": 0.00019813829787234042, + "loss": 0.9876, + "step": 15920 + }, + { + "epoch": 13.94, + "learning_rate": 0.0001980718085106383, + "loss": 0.7772, + "step": 15930 + }, + { + "epoch": 13.95, + "learning_rate": 0.00019800531914893613, + "loss": 0.8202, + "step": 15940 + }, + { + "epoch": 13.95, + "learning_rate": 0.000197938829787234, + "loss": 0.8194, + "step": 15950 + }, + { + "epoch": 13.96, + "learning_rate": 0.00019787234042553187, + "loss": 0.7863, + "step": 15960 + }, + { + "epoch": 13.97, + "learning_rate": 0.00019780585106382977, + "loss": 0.8283, + "step": 15970 + }, + { + "epoch": 13.98, + "learning_rate": 0.00019773936170212764, + "loss": 0.7745, + "step": 15980 + }, + { + "epoch": 13.99, + "learning_rate": 0.0001976728723404255, + "loss": 0.8281, + "step": 15990 + }, + { + "epoch": 14.0, + "learning_rate": 0.00019760638297872338, + "loss": 0.7716, + "step": 16000 + }, + { + "epoch": 14.01, + "learning_rate": 0.00019753989361702125, + "loss": 0.8981, + "step": 16010 + }, + { + "epoch": 14.02, + "learning_rate": 0.00019747340425531912, + "loss": 0.7819, + "step": 16020 + }, + { + "epoch": 14.02, + "learning_rate": 0.000197406914893617, + "loss": 0.6779, + "step": 16030 + }, + { + "epoch": 14.03, + "learning_rate": 0.00019734042553191486, + "loss": 0.8303, + "step": 16040 + }, + { + "epoch": 14.04, + "learning_rate": 0.00019727393617021276, + "loss": 0.7213, + "step": 16050 + }, + { + "epoch": 14.05, + "learning_rate": 0.00019720744680851062, + "loss": 0.8114, + "step": 16060 + }, + { + "epoch": 14.06, + "learning_rate": 0.0001971409574468085, + "loss": 0.6867, + "step": 16070 + }, + { + "epoch": 14.07, + "learning_rate": 0.00019707446808510636, + "loss": 0.6972, + "step": 16080 + }, + { + "epoch": 14.08, + "learning_rate": 0.00019700797872340423, + "loss": 0.7685, + "step": 16090 + }, + { + "epoch": 14.09, + "learning_rate": 0.0001969414893617021, + "loss": 0.6985, + "step": 16100 + }, + { + "epoch": 14.09, + "learning_rate": 0.00019687499999999997, + "loss": 0.7939, + "step": 16110 + }, + { + "epoch": 14.1, + "learning_rate": 0.00019680851063829784, + "loss": 0.7735, + "step": 16120 + }, + { + "epoch": 14.11, + "learning_rate": 0.00019674202127659574, + "loss": 0.7357, + "step": 16130 + }, + { + "epoch": 14.12, + "learning_rate": 0.0001966755319148936, + "loss": 0.802, + "step": 16140 + }, + { + "epoch": 14.13, + "learning_rate": 0.00019660904255319148, + "loss": 0.7361, + "step": 16150 + }, + { + "epoch": 14.14, + "learning_rate": 0.00019654255319148935, + "loss": 0.8536, + "step": 16160 + }, + { + "epoch": 14.15, + "learning_rate": 0.00019647606382978722, + "loss": 0.7138, + "step": 16170 + }, + { + "epoch": 14.16, + "learning_rate": 0.0001964095744680851, + "loss": 0.7561, + "step": 16180 + }, + { + "epoch": 14.16, + "learning_rate": 0.00019634308510638296, + "loss": 0.7063, + "step": 16190 + }, + { + "epoch": 14.17, + "learning_rate": 0.00019627659574468083, + "loss": 0.6616, + "step": 16200 + }, + { + "epoch": 14.17, + "eval_cer1": 0.3182201816278991, + "eval_cer2": 0.29486464315012306, + "eval_cer3": 0.2726886638353479, + "eval_cer4": 0.2720306513409962, + "eval_cer5": 0.2932484076433121, + "eval_loss": 1.1143051385879517, + "eval_runtime": 1313.0708, + "eval_samples_per_second": 6.671, + "step": 16200 + }, + { + "epoch": 14.18, + "learning_rate": 0.00019621010638297873, + "loss": 0.7557, + "step": 16210 + }, + { + "epoch": 14.19, + "learning_rate": 0.0001961436170212766, + "loss": 0.6934, + "step": 16220 + }, + { + "epoch": 14.2, + "learning_rate": 0.00019607712765957447, + "loss": 0.7144, + "step": 16230 + }, + { + "epoch": 14.21, + "learning_rate": 0.00019601063829787234, + "loss": 0.8616, + "step": 16240 + }, + { + "epoch": 14.22, + "learning_rate": 0.0001959441489361702, + "loss": 0.682, + "step": 16250 + }, + { + "epoch": 14.23, + "learning_rate": 0.00019587765957446808, + "loss": 0.7682, + "step": 16260 + }, + { + "epoch": 14.23, + "learning_rate": 0.00019581117021276595, + "loss": 0.6824, + "step": 16270 + }, + { + "epoch": 14.24, + "learning_rate": 0.00019574468085106382, + "loss": 0.6424, + "step": 16280 + }, + { + "epoch": 14.25, + "learning_rate": 0.00019567819148936166, + "loss": 0.8398, + "step": 16290 + }, + { + "epoch": 14.26, + "learning_rate": 0.00019561170212765953, + "loss": 0.722, + "step": 16300 + }, + { + "epoch": 14.27, + "learning_rate": 0.00019554521276595743, + "loss": 0.7341, + "step": 16310 + }, + { + "epoch": 14.28, + "learning_rate": 0.0001954787234042553, + "loss": 0.6773, + "step": 16320 + }, + { + "epoch": 14.29, + "learning_rate": 0.00019541223404255317, + "loss": 0.7365, + "step": 16330 + }, + { + "epoch": 14.3, + "learning_rate": 0.00019534574468085104, + "loss": 0.8071, + "step": 16340 + }, + { + "epoch": 14.3, + "learning_rate": 0.0001952792553191489, + "loss": 0.6234, + "step": 16350 + }, + { + "epoch": 14.31, + "learning_rate": 0.00019521276595744677, + "loss": 0.8399, + "step": 16360 + }, + { + "epoch": 14.32, + "learning_rate": 0.00019514627659574464, + "loss": 0.6696, + "step": 16370 + }, + { + "epoch": 14.33, + "learning_rate": 0.00019507978723404254, + "loss": 0.6734, + "step": 16380 + }, + { + "epoch": 14.34, + "learning_rate": 0.0001950132978723404, + "loss": 0.7585, + "step": 16390 + }, + { + "epoch": 14.35, + "learning_rate": 0.00019494680851063828, + "loss": 0.641, + "step": 16400 + }, + { + "epoch": 14.36, + "learning_rate": 0.00019488031914893615, + "loss": 0.7906, + "step": 16410 + }, + { + "epoch": 14.37, + "learning_rate": 0.00019481382978723402, + "loss": 0.791, + "step": 16420 + }, + { + "epoch": 14.37, + "learning_rate": 0.0001947473404255319, + "loss": 0.7852, + "step": 16430 + }, + { + "epoch": 14.38, + "learning_rate": 0.00019468085106382976, + "loss": 0.8255, + "step": 16440 + }, + { + "epoch": 14.39, + "learning_rate": 0.00019461436170212763, + "loss": 0.6949, + "step": 16450 + }, + { + "epoch": 14.4, + "learning_rate": 0.00019454787234042553, + "loss": 0.8579, + "step": 16460 + }, + { + "epoch": 14.41, + "learning_rate": 0.0001944813829787234, + "loss": 0.6611, + "step": 16470 + }, + { + "epoch": 14.42, + "learning_rate": 0.00019441489361702127, + "loss": 0.7366, + "step": 16480 + }, + { + "epoch": 14.43, + "learning_rate": 0.00019434840425531914, + "loss": 0.8814, + "step": 16490 + }, + { + "epoch": 14.44, + "learning_rate": 0.000194281914893617, + "loss": 0.6525, + "step": 16500 + }, + { + "epoch": 14.44, + "learning_rate": 0.00019421542553191488, + "loss": 0.7604, + "step": 16510 + }, + { + "epoch": 14.45, + "learning_rate": 0.00019414893617021275, + "loss": 0.8022, + "step": 16520 + }, + { + "epoch": 14.46, + "learning_rate": 0.00019408244680851062, + "loss": 0.7173, + "step": 16530 + }, + { + "epoch": 14.47, + "learning_rate": 0.00019401595744680851, + "loss": 0.7892, + "step": 16540 + }, + { + "epoch": 14.48, + "learning_rate": 0.00019394946808510638, + "loss": 0.6637, + "step": 16550 + }, + { + "epoch": 14.49, + "learning_rate": 0.00019388297872340425, + "loss": 0.8382, + "step": 16560 + }, + { + "epoch": 14.5, + "learning_rate": 0.00019381648936170212, + "loss": 0.7502, + "step": 16570 + }, + { + "epoch": 14.51, + "learning_rate": 0.00019375, + "loss": 0.7276, + "step": 16580 + }, + { + "epoch": 14.51, + "learning_rate": 0.00019368351063829786, + "loss": 0.8077, + "step": 16590 + }, + { + "epoch": 14.52, + "learning_rate": 0.00019361702127659573, + "loss": 0.6857, + "step": 16600 + }, + { + "epoch": 14.53, + "learning_rate": 0.0001935505319148936, + "loss": 0.7267, + "step": 16610 + }, + { + "epoch": 14.54, + "learning_rate": 0.0001934840425531915, + "loss": 0.7215, + "step": 16620 + }, + { + "epoch": 14.55, + "learning_rate": 0.00019341755319148937, + "loss": 0.779, + "step": 16630 + }, + { + "epoch": 14.56, + "learning_rate": 0.0001933510638297872, + "loss": 0.7738, + "step": 16640 + }, + { + "epoch": 14.57, + "learning_rate": 0.00019328457446808508, + "loss": 0.6824, + "step": 16650 + }, + { + "epoch": 14.58, + "learning_rate": 0.00019321808510638295, + "loss": 0.8226, + "step": 16660 + }, + { + "epoch": 14.58, + "learning_rate": 0.00019315159574468082, + "loss": 0.7909, + "step": 16670 + }, + { + "epoch": 14.59, + "learning_rate": 0.0001930851063829787, + "loss": 0.7064, + "step": 16680 + }, + { + "epoch": 14.6, + "learning_rate": 0.00019301861702127656, + "loss": 0.8026, + "step": 16690 + }, + { + "epoch": 14.61, + "learning_rate": 0.00019295212765957443, + "loss": 0.6652, + "step": 16700 + }, + { + "epoch": 14.62, + "learning_rate": 0.0001928856382978723, + "loss": 0.7503, + "step": 16710 + }, + { + "epoch": 14.63, + "learning_rate": 0.0001928191489361702, + "loss": 0.7841, + "step": 16720 + }, + { + "epoch": 14.64, + "learning_rate": 0.00019275265957446807, + "loss": 0.7588, + "step": 16730 + }, + { + "epoch": 14.65, + "learning_rate": 0.00019268617021276594, + "loss": 0.7842, + "step": 16740 + }, + { + "epoch": 14.65, + "learning_rate": 0.0001926196808510638, + "loss": 0.7365, + "step": 16750 + }, + { + "epoch": 14.66, + "learning_rate": 0.00019255319148936168, + "loss": 0.7845, + "step": 16760 + }, + { + "epoch": 14.67, + "learning_rate": 0.00019248670212765955, + "loss": 0.7154, + "step": 16770 + }, + { + "epoch": 14.68, + "learning_rate": 0.00019242021276595742, + "loss": 0.7513, + "step": 16780 + }, + { + "epoch": 14.69, + "learning_rate": 0.0001923537234042553, + "loss": 0.8221, + "step": 16790 + }, + { + "epoch": 14.7, + "learning_rate": 0.00019228723404255318, + "loss": 0.6601, + "step": 16800 + }, + { + "epoch": 14.7, + "eval_cer1": 0.30674183856048076, + "eval_cer2": 0.284954881050041, + "eval_cer3": 0.263312642927148, + "eval_cer4": 0.25776747480601436, + "eval_cer5": 0.2816135881104034, + "eval_loss": 1.0925976037979126, + "eval_runtime": 1292.5314, + "eval_samples_per_second": 6.777, + "step": 16800 + }, + { + "epoch": 14.71, + "learning_rate": 0.00019222074468085105, + "loss": 0.7836, + "step": 16810 + }, + { + "epoch": 14.72, + "learning_rate": 0.00019215425531914892, + "loss": 0.7487, + "step": 16820 + }, + { + "epoch": 14.72, + "learning_rate": 0.0001920877659574468, + "loss": 0.7906, + "step": 16830 + }, + { + "epoch": 14.73, + "learning_rate": 0.00019202127659574466, + "loss": 0.7396, + "step": 16840 + }, + { + "epoch": 14.74, + "learning_rate": 0.00019195478723404253, + "loss": 0.7204, + "step": 16850 + }, + { + "epoch": 14.75, + "learning_rate": 0.0001918882978723404, + "loss": 0.848, + "step": 16860 + }, + { + "epoch": 14.76, + "learning_rate": 0.00019182180851063827, + "loss": 0.7929, + "step": 16870 + }, + { + "epoch": 14.77, + "learning_rate": 0.00019175531914893617, + "loss": 0.7217, + "step": 16880 + }, + { + "epoch": 14.78, + "learning_rate": 0.00019168882978723404, + "loss": 0.8023, + "step": 16890 + }, + { + "epoch": 14.79, + "learning_rate": 0.0001916223404255319, + "loss": 0.7387, + "step": 16900 + }, + { + "epoch": 14.79, + "learning_rate": 0.00019155585106382978, + "loss": 0.804, + "step": 16910 + }, + { + "epoch": 14.8, + "learning_rate": 0.00019148936170212765, + "loss": 0.6628, + "step": 16920 + }, + { + "epoch": 14.81, + "learning_rate": 0.00019142287234042552, + "loss": 0.7611, + "step": 16930 + }, + { + "epoch": 14.82, + "learning_rate": 0.0001913563829787234, + "loss": 0.7139, + "step": 16940 + }, + { + "epoch": 14.83, + "learning_rate": 0.00019128989361702126, + "loss": 0.5858, + "step": 16950 + }, + { + "epoch": 14.84, + "learning_rate": 0.00019122340425531916, + "loss": 0.8531, + "step": 16960 + }, + { + "epoch": 14.85, + "learning_rate": 0.00019115691489361703, + "loss": 0.6779, + "step": 16970 + }, + { + "epoch": 14.86, + "learning_rate": 0.0001910904255319149, + "loss": 0.6848, + "step": 16980 + }, + { + "epoch": 14.86, + "learning_rate": 0.00019102393617021277, + "loss": 0.753, + "step": 16990 + }, + { + "epoch": 14.87, + "learning_rate": 0.0001909574468085106, + "loss": 0.6832, + "step": 17000 + }, + { + "epoch": 14.88, + "learning_rate": 0.00019089095744680848, + "loss": 0.812, + "step": 17010 + }, + { + "epoch": 14.89, + "learning_rate": 0.00019082446808510635, + "loss": 0.7017, + "step": 17020 + }, + { + "epoch": 14.9, + "learning_rate": 0.00019075797872340422, + "loss": 0.713, + "step": 17030 + }, + { + "epoch": 14.91, + "learning_rate": 0.0001906914893617021, + "loss": 0.8505, + "step": 17040 + }, + { + "epoch": 14.92, + "learning_rate": 0.00019062499999999998, + "loss": 0.7393, + "step": 17050 + }, + { + "epoch": 14.93, + "learning_rate": 0.00019055851063829785, + "loss": 0.8676, + "step": 17060 + }, + { + "epoch": 14.93, + "learning_rate": 0.00019049202127659572, + "loss": 0.6599, + "step": 17070 + }, + { + "epoch": 14.94, + "learning_rate": 0.0001904255319148936, + "loss": 0.808, + "step": 17080 + }, + { + "epoch": 14.95, + "learning_rate": 0.00019035904255319146, + "loss": 0.7492, + "step": 17090 + }, + { + "epoch": 14.96, + "learning_rate": 0.00019029255319148933, + "loss": 0.6244, + "step": 17100 + }, + { + "epoch": 14.97, + "learning_rate": 0.0001902260638297872, + "loss": 0.7312, + "step": 17110 + }, + { + "epoch": 14.98, + "learning_rate": 0.00019015957446808507, + "loss": 0.7036, + "step": 17120 + }, + { + "epoch": 14.99, + "learning_rate": 0.00019009308510638297, + "loss": 0.6583, + "step": 17130 + }, + { + "epoch": 15.0, + "learning_rate": 0.00019002659574468084, + "loss": 0.7847, + "step": 17140 + }, + { + "epoch": 15.0, + "learning_rate": 0.0001899601063829787, + "loss": 0.7587, + "step": 17150 + }, + { + "epoch": 15.01, + "learning_rate": 0.00018989361702127658, + "loss": 0.5985, + "step": 17160 + }, + { + "epoch": 15.02, + "learning_rate": 0.00018982712765957445, + "loss": 0.5428, + "step": 17170 + }, + { + "epoch": 15.03, + "learning_rate": 0.00018976063829787232, + "loss": 0.7111, + "step": 17180 + }, + { + "epoch": 15.04, + "learning_rate": 0.0001896941489361702, + "loss": 0.6093, + "step": 17190 + }, + { + "epoch": 15.05, + "learning_rate": 0.00018962765957446806, + "loss": 0.7919, + "step": 17200 + }, + { + "epoch": 15.06, + "learning_rate": 0.00018956117021276596, + "loss": 0.6537, + "step": 17210 + }, + { + "epoch": 15.07, + "learning_rate": 0.00018949468085106383, + "loss": 0.5033, + "step": 17220 + }, + { + "epoch": 15.07, + "learning_rate": 0.0001894281914893617, + "loss": 0.7868, + "step": 17230 + }, + { + "epoch": 15.08, + "learning_rate": 0.00018936170212765957, + "loss": 0.6799, + "step": 17240 + }, + { + "epoch": 15.09, + "learning_rate": 0.00018929521276595744, + "loss": 0.6626, + "step": 17250 + }, + { + "epoch": 15.1, + "learning_rate": 0.0001892287234042553, + "loss": 0.6801, + "step": 17260 + }, + { + "epoch": 15.11, + "learning_rate": 0.00018916223404255318, + "loss": 0.6047, + "step": 17270 + }, + { + "epoch": 15.12, + "learning_rate": 0.00018909574468085105, + "loss": 0.7759, + "step": 17280 + }, + { + "epoch": 15.13, + "learning_rate": 0.00018902925531914894, + "loss": 0.6011, + "step": 17290 + }, + { + "epoch": 15.14, + "learning_rate": 0.0001889627659574468, + "loss": 0.6787, + "step": 17300 + }, + { + "epoch": 15.14, + "learning_rate": 0.00018889627659574468, + "loss": 0.7185, + "step": 17310 + }, + { + "epoch": 15.15, + "learning_rate": 0.00018882978723404255, + "loss": 0.5043, + "step": 17320 + }, + { + "epoch": 15.16, + "learning_rate": 0.00018876329787234042, + "loss": 0.7851, + "step": 17330 + }, + { + "epoch": 15.17, + "learning_rate": 0.0001886968085106383, + "loss": 0.6158, + "step": 17340 + }, + { + "epoch": 15.18, + "learning_rate": 0.00018863031914893613, + "loss": 0.6477, + "step": 17350 + }, + { + "epoch": 15.19, + "learning_rate": 0.000188563829787234, + "loss": 0.6485, + "step": 17360 + }, + { + "epoch": 15.2, + "learning_rate": 0.00018849734042553187, + "loss": 0.5675, + "step": 17370 + }, + { + "epoch": 15.21, + "learning_rate": 0.00018843085106382974, + "loss": 0.774, + "step": 17380 + }, + { + "epoch": 15.21, + "learning_rate": 0.00018836436170212764, + "loss": 0.6351, + "step": 17390 + }, + { + "epoch": 15.22, + "learning_rate": 0.0001882978723404255, + "loss": 0.7172, + "step": 17400 + }, + { + "epoch": 15.22, + "eval_cer1": 0.32098848789710005, + "eval_cer2": 0.29401148482362593, + "eval_cer3": 0.26703691604050966, + "eval_cer4": 0.2685212015840819, + "eval_cer5": 0.2905307855626327, + "eval_loss": 1.1153998374938965, + "eval_runtime": 1299.1031, + "eval_samples_per_second": 6.743, + "step": 17400 + }, + { + "epoch": 15.23, + "learning_rate": 0.00018823138297872338, + "loss": 0.6856, + "step": 17410 + }, + { + "epoch": 15.24, + "learning_rate": 0.00018816489361702125, + "loss": 0.5883, + "step": 17420 + }, + { + "epoch": 15.25, + "learning_rate": 0.00018809840425531912, + "loss": 0.8231, + "step": 17430 + }, + { + "epoch": 15.26, + "learning_rate": 0.000188031914893617, + "loss": 0.6704, + "step": 17440 + }, + { + "epoch": 15.27, + "learning_rate": 0.00018796542553191486, + "loss": 0.7344, + "step": 17450 + }, + { + "epoch": 15.28, + "learning_rate": 0.00018789893617021273, + "loss": 0.7718, + "step": 17460 + }, + { + "epoch": 15.28, + "learning_rate": 0.00018783244680851063, + "loss": 0.5414, + "step": 17470 + }, + { + "epoch": 15.29, + "learning_rate": 0.0001877659574468085, + "loss": 0.7694, + "step": 17480 + }, + { + "epoch": 15.3, + "learning_rate": 0.00018769946808510637, + "loss": 0.5456, + "step": 17490 + }, + { + "epoch": 15.31, + "learning_rate": 0.00018763297872340424, + "loss": 0.6698, + "step": 17500 + }, + { + "epoch": 15.32, + "learning_rate": 0.0001875664893617021, + "loss": 0.697, + "step": 17510 + }, + { + "epoch": 15.33, + "learning_rate": 0.00018749999999999998, + "loss": 0.5647, + "step": 17520 + }, + { + "epoch": 15.34, + "learning_rate": 0.00018743351063829785, + "loss": 0.8236, + "step": 17530 + }, + { + "epoch": 15.35, + "learning_rate": 0.00018736702127659574, + "loss": 0.6323, + "step": 17540 + }, + { + "epoch": 15.35, + "learning_rate": 0.0001873005319148936, + "loss": 0.6286, + "step": 17550 + }, + { + "epoch": 15.36, + "learning_rate": 0.00018723404255319148, + "loss": 0.7415, + "step": 17560 + }, + { + "epoch": 15.37, + "learning_rate": 0.00018716755319148935, + "loss": 0.5495, + "step": 17570 + }, + { + "epoch": 15.38, + "learning_rate": 0.00018710106382978722, + "loss": 0.7731, + "step": 17580 + }, + { + "epoch": 15.39, + "learning_rate": 0.0001870345744680851, + "loss": 0.7555, + "step": 17590 + }, + { + "epoch": 15.4, + "learning_rate": 0.00018696808510638296, + "loss": 0.6797, + "step": 17600 + }, + { + "epoch": 15.41, + "learning_rate": 0.00018690159574468083, + "loss": 0.7008, + "step": 17610 + }, + { + "epoch": 15.42, + "learning_rate": 0.00018683510638297873, + "loss": 0.5672, + "step": 17620 + }, + { + "epoch": 15.42, + "learning_rate": 0.0001867686170212766, + "loss": 0.8127, + "step": 17630 + }, + { + "epoch": 15.43, + "learning_rate": 0.00018670212765957447, + "loss": 0.6467, + "step": 17640 + }, + { + "epoch": 15.44, + "learning_rate": 0.00018663563829787234, + "loss": 0.6344, + "step": 17650 + }, + { + "epoch": 15.45, + "learning_rate": 0.0001865691489361702, + "loss": 0.6963, + "step": 17660 + }, + { + "epoch": 15.46, + "learning_rate": 0.00018650265957446808, + "loss": 0.6144, + "step": 17670 + }, + { + "epoch": 15.47, + "learning_rate": 0.00018643617021276595, + "loss": 0.803, + "step": 17680 + }, + { + "epoch": 15.48, + "learning_rate": 0.00018636968085106382, + "loss": 0.6167, + "step": 17690 + }, + { + "epoch": 15.49, + "learning_rate": 0.00018630319148936166, + "loss": 0.6992, + "step": 17700 + }, + { + "epoch": 15.49, + "learning_rate": 0.00018623670212765953, + "loss": 0.6766, + "step": 17710 + }, + { + "epoch": 15.5, + "learning_rate": 0.00018617021276595743, + "loss": 0.6609, + "step": 17720 + }, + { + "epoch": 15.51, + "learning_rate": 0.0001861037234042553, + "loss": 0.8435, + "step": 17730 + }, + { + "epoch": 15.52, + "learning_rate": 0.00018603723404255317, + "loss": 0.6471, + "step": 17740 + }, + { + "epoch": 15.53, + "learning_rate": 0.00018597074468085104, + "loss": 0.8128, + "step": 17750 + }, + { + "epoch": 15.54, + "learning_rate": 0.0001859042553191489, + "loss": 0.6071, + "step": 17760 + }, + { + "epoch": 15.55, + "learning_rate": 0.00018583776595744678, + "loss": 0.5639, + "step": 17770 + }, + { + "epoch": 15.56, + "learning_rate": 0.00018577127659574465, + "loss": 0.8204, + "step": 17780 + }, + { + "epoch": 15.56, + "learning_rate": 0.00018570478723404252, + "loss": 0.6363, + "step": 17790 + }, + { + "epoch": 15.57, + "learning_rate": 0.00018563829787234041, + "loss": 0.631, + "step": 17800 + }, + { + "epoch": 15.58, + "learning_rate": 0.00018557180851063828, + "loss": 0.6795, + "step": 17810 + }, + { + "epoch": 15.59, + "learning_rate": 0.00018550531914893615, + "loss": 0.6171, + "step": 17820 + }, + { + "epoch": 15.6, + "learning_rate": 0.00018543882978723402, + "loss": 0.7451, + "step": 17830 + }, + { + "epoch": 15.61, + "learning_rate": 0.0001853723404255319, + "loss": 0.6931, + "step": 17840 + }, + { + "epoch": 15.62, + "learning_rate": 0.00018530585106382976, + "loss": 0.6954, + "step": 17850 + }, + { + "epoch": 15.63, + "learning_rate": 0.00018523936170212763, + "loss": 0.6735, + "step": 17860 + }, + { + "epoch": 15.63, + "learning_rate": 0.0001851728723404255, + "loss": 0.6475, + "step": 17870 + }, + { + "epoch": 15.64, + "learning_rate": 0.0001851063829787234, + "loss": 0.7984, + "step": 17880 + }, + { + "epoch": 15.65, + "learning_rate": 0.00018503989361702127, + "loss": 0.6117, + "step": 17890 + }, + { + "epoch": 15.66, + "learning_rate": 0.00018497340425531914, + "loss": 0.6654, + "step": 17900 + }, + { + "epoch": 15.67, + "learning_rate": 0.000184906914893617, + "loss": 0.73, + "step": 17910 + }, + { + "epoch": 15.68, + "learning_rate": 0.00018484042553191488, + "loss": 0.581, + "step": 17920 + }, + { + "epoch": 15.69, + "learning_rate": 0.00018477393617021275, + "loss": 0.7893, + "step": 17930 + }, + { + "epoch": 15.7, + "learning_rate": 0.00018470744680851062, + "loss": 0.6546, + "step": 17940 + }, + { + "epoch": 15.7, + "learning_rate": 0.0001846409574468085, + "loss": 0.6815, + "step": 17950 + }, + { + "epoch": 15.71, + "learning_rate": 0.00018457446808510639, + "loss": 0.7303, + "step": 17960 + }, + { + "epoch": 15.72, + "learning_rate": 0.00018450797872340426, + "loss": 0.5565, + "step": 17970 + }, + { + "epoch": 15.73, + "learning_rate": 0.00018444148936170213, + "loss": 0.8111, + "step": 17980 + }, + { + "epoch": 15.74, + "learning_rate": 0.000184375, + "loss": 0.6269, + "step": 17990 + }, + { + "epoch": 15.75, + "learning_rate": 0.00018430851063829787, + "loss": 0.7702, + "step": 18000 + }, + { + "epoch": 15.75, + "eval_cer1": 0.31433780088450763, + "eval_cer2": 0.29043478260869565, + "eval_cer3": 0.2632799738647501, + "eval_cer4": 0.26745870762097945, + "eval_cer5": 0.29265392781316346, + "eval_loss": 1.0847606658935547, + "eval_runtime": 1306.6216, + "eval_samples_per_second": 6.704, + "step": 18000 + }, + { + "epoch": 15.76, + "learning_rate": 0.00018424202127659574, + "loss": 0.7008, + "step": 18010 + }, + { + "epoch": 15.77, + "learning_rate": 0.0001841755319148936, + "loss": 0.6327, + "step": 18020 + }, + { + "epoch": 15.77, + "learning_rate": 0.00018410904255319148, + "loss": 0.8075, + "step": 18030 + }, + { + "epoch": 15.78, + "learning_rate": 0.00018404255319148937, + "loss": 0.5853, + "step": 18040 + }, + { + "epoch": 15.79, + "learning_rate": 0.00018397606382978721, + "loss": 0.7004, + "step": 18050 + }, + { + "epoch": 15.8, + "learning_rate": 0.00018390957446808508, + "loss": 0.6902, + "step": 18060 + }, + { + "epoch": 15.81, + "learning_rate": 0.00018384308510638295, + "loss": 0.6421, + "step": 18070 + }, + { + "epoch": 15.82, + "learning_rate": 0.00018377659574468082, + "loss": 0.7945, + "step": 18080 + }, + { + "epoch": 15.83, + "learning_rate": 0.0001837101063829787, + "loss": 0.6051, + "step": 18090 + }, + { + "epoch": 15.84, + "learning_rate": 0.00018364361702127656, + "loss": 0.7038, + "step": 18100 + }, + { + "epoch": 15.84, + "learning_rate": 0.00018357712765957443, + "loss": 0.6985, + "step": 18110 + }, + { + "epoch": 15.85, + "learning_rate": 0.0001835106382978723, + "loss": 0.6688, + "step": 18120 + }, + { + "epoch": 15.86, + "learning_rate": 0.0001834441489361702, + "loss": 0.7827, + "step": 18130 + }, + { + "epoch": 15.87, + "learning_rate": 0.00018337765957446807, + "loss": 0.6242, + "step": 18140 + }, + { + "epoch": 15.88, + "learning_rate": 0.00018331117021276594, + "loss": 0.6931, + "step": 18150 + }, + { + "epoch": 15.89, + "learning_rate": 0.0001832446808510638, + "loss": 0.7222, + "step": 18160 + }, + { + "epoch": 15.9, + "learning_rate": 0.00018317819148936168, + "loss": 0.628, + "step": 18170 + }, + { + "epoch": 15.91, + "learning_rate": 0.00018311170212765955, + "loss": 0.7439, + "step": 18180 + }, + { + "epoch": 15.91, + "learning_rate": 0.00018304521276595742, + "loss": 0.6832, + "step": 18190 + }, + { + "epoch": 15.92, + "learning_rate": 0.0001829787234042553, + "loss": 0.7124, + "step": 18200 + }, + { + "epoch": 15.93, + "learning_rate": 0.0001829122340425532, + "loss": 0.6517, + "step": 18210 + }, + { + "epoch": 15.94, + "learning_rate": 0.00018284574468085106, + "loss": 0.5765, + "step": 18220 + }, + { + "epoch": 15.95, + "learning_rate": 0.00018277925531914893, + "loss": 0.8116, + "step": 18230 + }, + { + "epoch": 15.96, + "learning_rate": 0.0001827127659574468, + "loss": 0.6687, + "step": 18240 + }, + { + "epoch": 15.97, + "learning_rate": 0.00018264627659574467, + "loss": 0.7591, + "step": 18250 + }, + { + "epoch": 15.98, + "learning_rate": 0.00018257978723404254, + "loss": 0.7089, + "step": 18260 + }, + { + "epoch": 15.98, + "learning_rate": 0.0001825132978723404, + "loss": 0.6328, + "step": 18270 + }, + { + "epoch": 15.99, + "learning_rate": 0.00018244680851063828, + "loss": 0.7318, + "step": 18280 + }, + { + "epoch": 16.0, + "learning_rate": 0.00018238031914893617, + "loss": 0.6638, + "step": 18290 + }, + { + "epoch": 16.01, + "learning_rate": 0.00018231382978723404, + "loss": 0.6638, + "step": 18300 + }, + { + "epoch": 16.02, + "learning_rate": 0.0001822473404255319, + "loss": 0.5222, + "step": 18310 + }, + { + "epoch": 16.03, + "learning_rate": 0.00018218085106382978, + "loss": 0.6836, + "step": 18320 + }, + { + "epoch": 16.04, + "learning_rate": 0.00018211436170212765, + "loss": 0.695, + "step": 18330 + }, + { + "epoch": 16.05, + "learning_rate": 0.00018204787234042552, + "loss": 0.5796, + "step": 18340 + }, + { + "epoch": 16.05, + "learning_rate": 0.0001819813829787234, + "loss": 0.7152, + "step": 18350 + }, + { + "epoch": 16.06, + "learning_rate": 0.00018191489361702126, + "loss": 0.4965, + "step": 18360 + }, + { + "epoch": 16.07, + "learning_rate": 0.00018184840425531916, + "loss": 0.6958, + "step": 18370 + }, + { + "epoch": 16.08, + "learning_rate": 0.00018178191489361703, + "loss": 0.6407, + "step": 18380 + }, + { + "epoch": 16.09, + "learning_rate": 0.0001817154255319149, + "loss": 0.4969, + "step": 18390 + }, + { + "epoch": 16.1, + "learning_rate": 0.00018164893617021277, + "loss": 0.788, + "step": 18400 + }, + { + "epoch": 16.11, + "learning_rate": 0.0001815824468085106, + "loss": 0.5648, + "step": 18410 + }, + { + "epoch": 16.12, + "learning_rate": 0.00018151595744680848, + "loss": 0.6607, + "step": 18420 + }, + { + "epoch": 16.12, + "learning_rate": 0.00018144946808510635, + "loss": 0.5947, + "step": 18430 + }, + { + "epoch": 16.13, + "learning_rate": 0.00018138297872340422, + "loss": 0.6444, + "step": 18440 + }, + { + "epoch": 16.14, + "learning_rate": 0.0001813164893617021, + "loss": 0.7331, + "step": 18450 + }, + { + "epoch": 16.15, + "learning_rate": 0.00018124999999999996, + "loss": 0.5287, + "step": 18460 + }, + { + "epoch": 16.16, + "learning_rate": 0.00018118351063829786, + "loss": 0.7092, + "step": 18470 + }, + { + "epoch": 16.17, + "learning_rate": 0.00018111702127659573, + "loss": 0.5647, + "step": 18480 + }, + { + "epoch": 16.18, + "learning_rate": 0.0001810505319148936, + "loss": 0.5094, + "step": 18490 + }, + { + "epoch": 16.19, + "learning_rate": 0.00018098404255319147, + "loss": 0.6664, + "step": 18500 + }, + { + "epoch": 16.19, + "learning_rate": 0.00018091755319148934, + "loss": 0.5014, + "step": 18510 + }, + { + "epoch": 16.2, + "learning_rate": 0.0001808510638297872, + "loss": 0.6867, + "step": 18520 + }, + { + "epoch": 16.21, + "learning_rate": 0.00018078457446808508, + "loss": 0.5517, + "step": 18530 + }, + { + "epoch": 16.22, + "learning_rate": 0.00018071808510638295, + "loss": 0.5359, + "step": 18540 + }, + { + "epoch": 16.23, + "learning_rate": 0.00018065159574468084, + "loss": 0.661, + "step": 18550 + }, + { + "epoch": 16.24, + "learning_rate": 0.0001805851063829787, + "loss": 0.6095, + "step": 18560 + }, + { + "epoch": 16.25, + "learning_rate": 0.00018051861702127658, + "loss": 0.6484, + "step": 18570 + }, + { + "epoch": 16.26, + "learning_rate": 0.00018045212765957445, + "loss": 0.639, + "step": 18580 + }, + { + "epoch": 16.26, + "learning_rate": 0.00018038563829787232, + "loss": 0.5913, + "step": 18590 + }, + { + "epoch": 16.27, + "learning_rate": 0.0001803191489361702, + "loss": 0.6988, + "step": 18600 + }, + { + "epoch": 16.27, + "eval_cer1": 0.30761959420681273, + "eval_cer2": 0.28213289581624285, + "eval_cer3": 0.25655014701078077, + "eval_cer4": 0.26105154705560385, + "eval_cer5": 0.2865392781316348, + "eval_loss": 1.09721839427948, + "eval_runtime": 1356.4898, + "eval_samples_per_second": 6.458, + "step": 18600 + }, + { + "epoch": 16.28, + "learning_rate": 0.00018025265957446806, + "loss": 0.5915, + "step": 18610 + }, + { + "epoch": 16.29, + "learning_rate": 0.00018018617021276593, + "loss": 0.6926, + "step": 18620 + }, + { + "epoch": 16.3, + "learning_rate": 0.00018011968085106383, + "loss": 0.5834, + "step": 18630 + }, + { + "epoch": 16.31, + "learning_rate": 0.0001800531914893617, + "loss": 0.5907, + "step": 18640 + }, + { + "epoch": 16.32, + "learning_rate": 0.00017998670212765957, + "loss": 0.653, + "step": 18650 + }, + { + "epoch": 16.33, + "learning_rate": 0.00017992021276595744, + "loss": 0.4958, + "step": 18660 + }, + { + "epoch": 16.33, + "learning_rate": 0.0001798537234042553, + "loss": 0.6977, + "step": 18670 + }, + { + "epoch": 16.34, + "learning_rate": 0.00017978723404255318, + "loss": 0.5907, + "step": 18680 + }, + { + "epoch": 16.35, + "learning_rate": 0.00017972074468085105, + "loss": 0.5366, + "step": 18690 + }, + { + "epoch": 16.36, + "learning_rate": 0.00017965425531914895, + "loss": 0.6171, + "step": 18700 + }, + { + "epoch": 16.37, + "learning_rate": 0.00017958776595744682, + "loss": 0.5782, + "step": 18710 + }, + { + "epoch": 16.38, + "learning_rate": 0.00017952127659574469, + "loss": 0.7277, + "step": 18720 + }, + { + "epoch": 16.39, + "learning_rate": 0.00017945478723404256, + "loss": 0.599, + "step": 18730 + }, + { + "epoch": 16.4, + "learning_rate": 0.00017938829787234042, + "loss": 0.6258, + "step": 18740 + }, + { + "epoch": 16.4, + "learning_rate": 0.0001793218085106383, + "loss": 0.7215, + "step": 18750 + }, + { + "epoch": 16.41, + "learning_rate": 0.00017925531914893614, + "loss": 0.6798, + "step": 18760 + }, + { + "epoch": 16.42, + "learning_rate": 0.000179188829787234, + "loss": 0.7162, + "step": 18770 + }, + { + "epoch": 16.43, + "learning_rate": 0.00017912234042553188, + "loss": 0.6553, + "step": 18780 + }, + { + "epoch": 16.44, + "learning_rate": 0.00017905585106382975, + "loss": 0.6856, + "step": 18790 + }, + { + "epoch": 16.45, + "learning_rate": 0.00017898936170212764, + "loss": 0.7643, + "step": 18800 + }, + { + "epoch": 16.46, + "learning_rate": 0.00017892287234042551, + "loss": 0.5566, + "step": 18810 + }, + { + "epoch": 16.47, + "learning_rate": 0.00017885638297872338, + "loss": 0.7172, + "step": 18820 + }, + { + "epoch": 16.47, + "learning_rate": 0.00017878989361702125, + "loss": 0.6327, + "step": 18830 + }, + { + "epoch": 16.48, + "learning_rate": 0.00017872340425531912, + "loss": 0.5931, + "step": 18840 + }, + { + "epoch": 16.49, + "learning_rate": 0.000178656914893617, + "loss": 0.7674, + "step": 18850 + }, + { + "epoch": 16.5, + "learning_rate": 0.00017859042553191486, + "loss": 0.6399, + "step": 18860 + }, + { + "epoch": 16.51, + "learning_rate": 0.00017852393617021273, + "loss": 0.6949, + "step": 18870 + }, + { + "epoch": 16.52, + "learning_rate": 0.00017845744680851063, + "loss": 0.6445, + "step": 18880 + }, + { + "epoch": 16.53, + "learning_rate": 0.0001783909574468085, + "loss": 0.6549, + "step": 18890 + }, + { + "epoch": 16.54, + "learning_rate": 0.00017832446808510637, + "loss": 0.7729, + "step": 18900 + }, + { + "epoch": 16.54, + "learning_rate": 0.00017825797872340424, + "loss": 0.633, + "step": 18910 + }, + { + "epoch": 16.55, + "learning_rate": 0.0001781914893617021, + "loss": 0.6874, + "step": 18920 + }, + { + "epoch": 16.56, + "learning_rate": 0.00017812499999999998, + "loss": 0.6257, + "step": 18930 + }, + { + "epoch": 16.57, + "learning_rate": 0.00017805851063829785, + "loss": 0.5936, + "step": 18940 + }, + { + "epoch": 16.58, + "learning_rate": 0.00017799202127659572, + "loss": 0.641, + "step": 18950 + }, + { + "epoch": 16.59, + "learning_rate": 0.00017792553191489362, + "loss": 0.6255, + "step": 18960 + }, + { + "epoch": 16.6, + "learning_rate": 0.00017785904255319149, + "loss": 0.6819, + "step": 18970 + }, + { + "epoch": 16.61, + "learning_rate": 0.00017779255319148936, + "loss": 0.6004, + "step": 18980 + }, + { + "epoch": 16.61, + "learning_rate": 0.00017772606382978723, + "loss": 0.6377, + "step": 18990 + }, + { + "epoch": 16.62, + "learning_rate": 0.0001776595744680851, + "loss": 0.6806, + "step": 19000 + }, + { + "epoch": 16.63, + "learning_rate": 0.00017759308510638297, + "loss": 0.5278, + "step": 19010 + }, + { + "epoch": 16.64, + "learning_rate": 0.00017752659574468084, + "loss": 0.7199, + "step": 19020 + }, + { + "epoch": 16.65, + "learning_rate": 0.0001774601063829787, + "loss": 0.6461, + "step": 19030 + }, + { + "epoch": 16.66, + "learning_rate": 0.0001773936170212766, + "loss": 0.6685, + "step": 19040 + }, + { + "epoch": 16.67, + "learning_rate": 0.00017732712765957447, + "loss": 0.6724, + "step": 19050 + }, + { + "epoch": 16.68, + "learning_rate": 0.00017726063829787234, + "loss": 0.6025, + "step": 19060 + }, + { + "epoch": 16.68, + "learning_rate": 0.0001771941489361702, + "loss": 0.6563, + "step": 19070 + }, + { + "epoch": 16.69, + "learning_rate": 0.00017712765957446808, + "loss": 0.5758, + "step": 19080 + }, + { + "epoch": 16.7, + "learning_rate": 0.00017706117021276595, + "loss": 0.6007, + "step": 19090 + }, + { + "epoch": 16.71, + "learning_rate": 0.00017699468085106382, + "loss": 0.6902, + "step": 19100 + }, + { + "epoch": 16.72, + "learning_rate": 0.00017692819148936166, + "loss": 0.5635, + "step": 19110 + }, + { + "epoch": 16.73, + "learning_rate": 0.00017686170212765953, + "loss": 0.6664, + "step": 19120 + }, + { + "epoch": 16.74, + "learning_rate": 0.0001767952127659574, + "loss": 0.6562, + "step": 19130 + }, + { + "epoch": 16.75, + "learning_rate": 0.0001767287234042553, + "loss": 0.5369, + "step": 19140 + }, + { + "epoch": 16.75, + "learning_rate": 0.00017666223404255317, + "loss": 0.6635, + "step": 19150 + }, + { + "epoch": 16.76, + "learning_rate": 0.00017659574468085104, + "loss": 0.5872, + "step": 19160 + }, + { + "epoch": 16.77, + "learning_rate": 0.0001765292553191489, + "loss": 0.6556, + "step": 19170 + }, + { + "epoch": 16.78, + "learning_rate": 0.00017646276595744678, + "loss": 0.6334, + "step": 19180 + }, + { + "epoch": 16.79, + "learning_rate": 0.00017639627659574465, + "loss": 0.5418, + "step": 19190 + }, + { + "epoch": 16.8, + "learning_rate": 0.00017632978723404252, + "loss": 0.7411, + "step": 19200 + }, + { + "epoch": 16.8, + "eval_cer1": 0.30410857162148475, + "eval_cer2": 0.2792780968006563, + "eval_cer3": 0.25354459327017315, + "eval_cer4": 0.2581860330339032, + "eval_cer5": 0.2791507430997877, + "eval_loss": 1.0727698802947998, + "eval_runtime": 1267.8518, + "eval_samples_per_second": 6.909, + "step": 19200 + }, + { + "epoch": 16.81, + "learning_rate": 0.00017626329787234042, + "loss": 0.4841, + "step": 19210 + }, + { + "epoch": 16.82, + "learning_rate": 0.0001761968085106383, + "loss": 0.7058, + "step": 19220 + }, + { + "epoch": 16.82, + "learning_rate": 0.00017613031914893616, + "loss": 0.6341, + "step": 19230 + }, + { + "epoch": 16.83, + "learning_rate": 0.00017606382978723403, + "loss": 0.539, + "step": 19240 + }, + { + "epoch": 16.84, + "learning_rate": 0.0001759973404255319, + "loss": 0.6752, + "step": 19250 + }, + { + "epoch": 16.85, + "learning_rate": 0.00017593085106382977, + "loss": 0.6126, + "step": 19260 + }, + { + "epoch": 16.86, + "learning_rate": 0.00017586436170212764, + "loss": 0.6215, + "step": 19270 + }, + { + "epoch": 16.87, + "learning_rate": 0.0001757978723404255, + "loss": 0.6387, + "step": 19280 + }, + { + "epoch": 16.88, + "learning_rate": 0.0001757313829787234, + "loss": 0.5976, + "step": 19290 + }, + { + "epoch": 16.89, + "learning_rate": 0.00017566489361702127, + "loss": 0.6805, + "step": 19300 + }, + { + "epoch": 16.89, + "learning_rate": 0.00017559840425531914, + "loss": 0.5206, + "step": 19310 + }, + { + "epoch": 16.9, + "learning_rate": 0.000175531914893617, + "loss": 0.663, + "step": 19320 + }, + { + "epoch": 16.91, + "learning_rate": 0.00017546542553191488, + "loss": 0.6756, + "step": 19330 + }, + { + "epoch": 16.92, + "learning_rate": 0.00017539893617021275, + "loss": 0.5813, + "step": 19340 + }, + { + "epoch": 16.93, + "learning_rate": 0.00017533244680851062, + "loss": 0.6291, + "step": 19350 + }, + { + "epoch": 16.94, + "learning_rate": 0.0001752659574468085, + "loss": 0.5561, + "step": 19360 + }, + { + "epoch": 16.95, + "learning_rate": 0.0001751994680851064, + "loss": 0.6612, + "step": 19370 + }, + { + "epoch": 16.95, + "learning_rate": 0.00017513297872340426, + "loss": 0.6275, + "step": 19380 + }, + { + "epoch": 16.96, + "learning_rate": 0.00017506648936170213, + "loss": 0.6135, + "step": 19390 + }, + { + "epoch": 16.97, + "learning_rate": 0.000175, + "loss": 0.6872, + "step": 19400 + }, + { + "epoch": 16.98, + "learning_rate": 0.00017493351063829787, + "loss": 0.5953, + "step": 19410 + }, + { + "epoch": 16.99, + "learning_rate": 0.00017486702127659574, + "loss": 0.6236, + "step": 19420 + }, + { + "epoch": 17.0, + "learning_rate": 0.0001748005319148936, + "loss": 0.5999, + "step": 19430 + }, + { + "epoch": 17.01, + "learning_rate": 0.00017473404255319148, + "loss": 0.7181, + "step": 19440 + }, + { + "epoch": 17.02, + "learning_rate": 0.00017466755319148937, + "loss": 0.4609, + "step": 19450 + }, + { + "epoch": 17.03, + "learning_rate": 0.0001746010638297872, + "loss": 0.5641, + "step": 19460 + }, + { + "epoch": 17.03, + "learning_rate": 0.0001745345744680851, + "loss": 0.6709, + "step": 19470 + }, + { + "epoch": 17.04, + "learning_rate": 0.00017446808510638296, + "loss": 0.5105, + "step": 19480 + }, + { + "epoch": 17.05, + "learning_rate": 0.00017440159574468083, + "loss": 0.691, + "step": 19490 + }, + { + "epoch": 17.06, + "learning_rate": 0.0001743351063829787, + "loss": 0.5724, + "step": 19500 + }, + { + "epoch": 17.07, + "learning_rate": 0.00017426861702127657, + "loss": 0.591, + "step": 19510 + }, + { + "epoch": 17.08, + "learning_rate": 0.00017420212765957444, + "loss": 0.609, + "step": 19520 + }, + { + "epoch": 17.09, + "learning_rate": 0.0001741356382978723, + "loss": 0.438, + "step": 19530 + }, + { + "epoch": 17.1, + "learning_rate": 0.00017406914893617018, + "loss": 0.6271, + "step": 19540 + }, + { + "epoch": 17.1, + "learning_rate": 0.00017400265957446807, + "loss": 0.4815, + "step": 19550 + }, + { + "epoch": 17.11, + "learning_rate": 0.00017393617021276594, + "loss": 0.5926, + "step": 19560 + }, + { + "epoch": 17.12, + "learning_rate": 0.0001738696808510638, + "loss": 0.6588, + "step": 19570 + }, + { + "epoch": 17.13, + "learning_rate": 0.00017380319148936168, + "loss": 0.508, + "step": 19580 + }, + { + "epoch": 17.14, + "learning_rate": 0.00017373670212765955, + "loss": 0.7072, + "step": 19590 + }, + { + "epoch": 17.15, + "learning_rate": 0.00017367021276595742, + "loss": 0.5317, + "step": 19600 + }, + { + "epoch": 17.16, + "learning_rate": 0.0001736037234042553, + "loss": 0.5451, + "step": 19610 + }, + { + "epoch": 17.17, + "learning_rate": 0.00017353723404255316, + "loss": 0.6444, + "step": 19620 + }, + { + "epoch": 17.17, + "learning_rate": 0.00017347074468085106, + "loss": 0.4646, + "step": 19630 + }, + { + "epoch": 17.18, + "learning_rate": 0.00017340425531914893, + "loss": 0.688, + "step": 19640 + }, + { + "epoch": 17.19, + "learning_rate": 0.0001733377659574468, + "loss": 0.5198, + "step": 19650 + }, + { + "epoch": 17.2, + "learning_rate": 0.00017327127659574467, + "loss": 0.5481, + "step": 19660 + }, + { + "epoch": 17.21, + "learning_rate": 0.00017320478723404254, + "loss": 0.6149, + "step": 19670 + }, + { + "epoch": 17.22, + "learning_rate": 0.0001731382978723404, + "loss": 0.4111, + "step": 19680 + }, + { + "epoch": 17.23, + "learning_rate": 0.00017307180851063828, + "loss": 0.6803, + "step": 19690 + }, + { + "epoch": 17.24, + "learning_rate": 0.00017300531914893615, + "loss": 0.5039, + "step": 19700 + }, + { + "epoch": 17.24, + "learning_rate": 0.00017293882978723405, + "loss": 0.5473, + "step": 19710 + }, + { + "epoch": 17.25, + "learning_rate": 0.00017287234042553192, + "loss": 0.6094, + "step": 19720 + }, + { + "epoch": 17.26, + "learning_rate": 0.00017280585106382978, + "loss": 0.4418, + "step": 19730 + }, + { + "epoch": 17.27, + "learning_rate": 0.00017273936170212765, + "loss": 0.6492, + "step": 19740 + }, + { + "epoch": 17.28, + "learning_rate": 0.00017267287234042552, + "loss": 0.4409, + "step": 19750 + }, + { + "epoch": 17.29, + "learning_rate": 0.0001726063829787234, + "loss": 0.6032, + "step": 19760 + }, + { + "epoch": 17.3, + "learning_rate": 0.00017253989361702126, + "loss": 0.6344, + "step": 19770 + }, + { + "epoch": 17.31, + "learning_rate": 0.00017247340425531913, + "loss": 0.4213, + "step": 19780 + }, + { + "epoch": 17.31, + "learning_rate": 0.00017240691489361703, + "loss": 0.6445, + "step": 19790 + }, + { + "epoch": 17.32, + "learning_rate": 0.0001723404255319149, + "loss": 0.5581, + "step": 19800 + }, + { + "epoch": 17.32, + "eval_cer1": 0.293744303028257, + "eval_cer2": 0.27212469237079573, + "eval_cer3": 0.24900359359686378, + "eval_cer4": 0.2519720531890917, + "eval_cer5": 0.27176220806794055, + "eval_loss": 1.0701156854629517, + "eval_runtime": 1280.4428, + "eval_samples_per_second": 6.841, + "step": 19800 + }, + { + "epoch": 17.33, + "learning_rate": 0.00017227393617021277, + "loss": 0.5871, + "step": 19810 + }, + { + "epoch": 17.34, + "learning_rate": 0.00017220744680851061, + "loss": 0.6256, + "step": 19820 + }, + { + "epoch": 17.35, + "learning_rate": 0.00017214095744680848, + "loss": 0.5534, + "step": 19830 + }, + { + "epoch": 17.36, + "learning_rate": 0.00017207446808510635, + "loss": 0.6941, + "step": 19840 + }, + { + "epoch": 17.37, + "learning_rate": 0.00017200797872340422, + "loss": 0.5746, + "step": 19850 + }, + { + "epoch": 17.38, + "learning_rate": 0.0001719414893617021, + "loss": 0.626, + "step": 19860 + }, + { + "epoch": 17.38, + "learning_rate": 0.00017187499999999996, + "loss": 0.5767, + "step": 19870 + }, + { + "epoch": 17.39, + "learning_rate": 0.00017180851063829786, + "loss": 0.4722, + "step": 19880 + }, + { + "epoch": 17.4, + "learning_rate": 0.00017174202127659573, + "loss": 0.6618, + "step": 19890 + }, + { + "epoch": 17.41, + "learning_rate": 0.0001716755319148936, + "loss": 0.5226, + "step": 19900 + }, + { + "epoch": 17.42, + "learning_rate": 0.00017160904255319147, + "loss": 0.5725, + "step": 19910 + }, + { + "epoch": 17.43, + "learning_rate": 0.00017154255319148934, + "loss": 0.5988, + "step": 19920 + }, + { + "epoch": 17.44, + "learning_rate": 0.0001714760638297872, + "loss": 0.4122, + "step": 19930 + }, + { + "epoch": 17.45, + "learning_rate": 0.00017140957446808508, + "loss": 0.7243, + "step": 19940 + }, + { + "epoch": 17.45, + "learning_rate": 0.00017134308510638295, + "loss": 0.6179, + "step": 19950 + }, + { + "epoch": 17.46, + "learning_rate": 0.00017127659574468085, + "loss": 0.6005, + "step": 19960 + }, + { + "epoch": 17.47, + "learning_rate": 0.00017121010638297872, + "loss": 0.5023, + "step": 19970 + }, + { + "epoch": 17.48, + "learning_rate": 0.00017114361702127659, + "loss": 0.4566, + "step": 19980 + }, + { + "epoch": 17.49, + "learning_rate": 0.00017107712765957446, + "loss": 0.6697, + "step": 19990 + }, + { + "epoch": 17.5, + "learning_rate": 0.00017101063829787233, + "loss": 0.5555, + "step": 20000 + }, + { + "epoch": 17.51, + "learning_rate": 0.0001709441489361702, + "loss": 0.5743, + "step": 20010 + }, + { + "epoch": 17.52, + "learning_rate": 0.00017087765957446807, + "loss": 0.675, + "step": 20020 + }, + { + "epoch": 17.52, + "learning_rate": 0.00017081117021276593, + "loss": 0.5662, + "step": 20030 + }, + { + "epoch": 17.53, + "learning_rate": 0.00017074468085106383, + "loss": 0.6109, + "step": 20040 + }, + { + "epoch": 17.54, + "learning_rate": 0.0001706781914893617, + "loss": 0.521, + "step": 20050 + }, + { + "epoch": 17.55, + "learning_rate": 0.00017061170212765957, + "loss": 0.5853, + "step": 20060 + }, + { + "epoch": 17.56, + "learning_rate": 0.00017054521276595744, + "loss": 0.5989, + "step": 20070 + }, + { + "epoch": 17.57, + "learning_rate": 0.0001704787234042553, + "loss": 0.5808, + "step": 20080 + }, + { + "epoch": 17.58, + "learning_rate": 0.00017041223404255318, + "loss": 0.6298, + "step": 20090 + }, + { + "epoch": 17.59, + "learning_rate": 0.00017034574468085105, + "loss": 0.5581, + "step": 20100 + }, + { + "epoch": 17.59, + "learning_rate": 0.00017027925531914892, + "loss": 0.5618, + "step": 20110 + }, + { + "epoch": 17.6, + "learning_rate": 0.00017021276595744682, + "loss": 0.6126, + "step": 20120 + }, + { + "epoch": 17.61, + "learning_rate": 0.0001701462765957447, + "loss": 0.4804, + "step": 20130 + }, + { + "epoch": 17.62, + "learning_rate": 0.00017007978723404256, + "loss": 0.7326, + "step": 20140 + }, + { + "epoch": 17.63, + "learning_rate": 0.00017001329787234043, + "loss": 0.5373, + "step": 20150 + }, + { + "epoch": 17.64, + "learning_rate": 0.0001699468085106383, + "loss": 0.5139, + "step": 20160 + }, + { + "epoch": 17.65, + "learning_rate": 0.00016988031914893614, + "loss": 0.6478, + "step": 20170 + }, + { + "epoch": 17.66, + "learning_rate": 0.000169813829787234, + "loss": 0.474, + "step": 20180 + }, + { + "epoch": 17.66, + "learning_rate": 0.00016974734042553188, + "loss": 0.7799, + "step": 20190 + }, + { + "epoch": 17.67, + "learning_rate": 0.00016968085106382975, + "loss": 0.5146, + "step": 20200 + }, + { + "epoch": 17.68, + "learning_rate": 0.00016961436170212762, + "loss": 0.5379, + "step": 20210 + }, + { + "epoch": 17.69, + "learning_rate": 0.00016954787234042552, + "loss": 0.5497, + "step": 20220 + }, + { + "epoch": 17.7, + "learning_rate": 0.00016948138297872339, + "loss": 0.4726, + "step": 20230 + }, + { + "epoch": 17.71, + "learning_rate": 0.00016941489361702126, + "loss": 0.602, + "step": 20240 + }, + { + "epoch": 17.72, + "learning_rate": 0.00016934840425531913, + "loss": 0.6149, + "step": 20250 + }, + { + "epoch": 17.72, + "learning_rate": 0.000169281914893617, + "loss": 0.607, + "step": 20260 + }, + { + "epoch": 17.73, + "learning_rate": 0.00016921542553191487, + "loss": 0.6173, + "step": 20270 + }, + { + "epoch": 17.74, + "learning_rate": 0.00016914893617021274, + "loss": 0.5137, + "step": 20280 + }, + { + "epoch": 17.75, + "learning_rate": 0.0001690824468085106, + "loss": 0.6965, + "step": 20290 + }, + { + "epoch": 17.76, + "learning_rate": 0.0001690159574468085, + "loss": 0.6567, + "step": 20300 + }, + { + "epoch": 17.77, + "learning_rate": 0.00016894946808510637, + "loss": 0.525, + "step": 20310 + }, + { + "epoch": 17.78, + "learning_rate": 0.00016888297872340424, + "loss": 0.5644, + "step": 20320 + }, + { + "epoch": 17.79, + "learning_rate": 0.0001688164893617021, + "loss": 0.4628, + "step": 20330 + }, + { + "epoch": 17.79, + "learning_rate": 0.00016874999999999998, + "loss": 0.6595, + "step": 20340 + }, + { + "epoch": 17.8, + "learning_rate": 0.00016868351063829785, + "loss": 0.5256, + "step": 20350 + }, + { + "epoch": 17.81, + "learning_rate": 0.00016861702127659572, + "loss": 0.5931, + "step": 20360 + }, + { + "epoch": 17.82, + "learning_rate": 0.00016855053191489362, + "loss": 0.6076, + "step": 20370 + }, + { + "epoch": 17.83, + "learning_rate": 0.0001684840425531915, + "loss": 0.5627, + "step": 20380 + }, + { + "epoch": 17.84, + "learning_rate": 0.00016841755319148936, + "loss": 0.6577, + "step": 20390 + }, + { + "epoch": 17.85, + "learning_rate": 0.00016835106382978723, + "loss": 0.5341, + "step": 20400 + }, + { + "epoch": 17.85, + "eval_cer1": 0.2937105431957058, + "eval_cer2": 0.26989335520918784, + "eval_cer3": 0.2455080039202875, + "eval_cer4": 0.24756109340287838, + "eval_cer5": 0.270828025477707, + "eval_loss": 1.049605369567871, + "eval_runtime": 1274.4878, + "eval_samples_per_second": 6.873, + "step": 20400 + }, + { + "epoch": 17.86, + "learning_rate": 0.0001682845744680851, + "loss": 0.5403, + "step": 20410 + }, + { + "epoch": 17.86, + "learning_rate": 0.00016821808510638297, + "loss": 0.6146, + "step": 20420 + }, + { + "epoch": 17.87, + "learning_rate": 0.00016815159574468084, + "loss": 0.4637, + "step": 20430 + }, + { + "epoch": 17.88, + "learning_rate": 0.0001680851063829787, + "loss": 0.6556, + "step": 20440 + }, + { + "epoch": 17.89, + "learning_rate": 0.0001680186170212766, + "loss": 0.4853, + "step": 20450 + }, + { + "epoch": 17.9, + "learning_rate": 0.00016795212765957447, + "loss": 0.5586, + "step": 20460 + }, + { + "epoch": 17.91, + "learning_rate": 0.00016788563829787234, + "loss": 0.5801, + "step": 20470 + }, + { + "epoch": 17.92, + "learning_rate": 0.00016781914893617021, + "loss": 0.4773, + "step": 20480 + }, + { + "epoch": 17.93, + "learning_rate": 0.00016775265957446808, + "loss": 0.6119, + "step": 20490 + }, + { + "epoch": 17.93, + "learning_rate": 0.00016768617021276595, + "loss": 0.5564, + "step": 20500 + }, + { + "epoch": 17.94, + "learning_rate": 0.00016761968085106382, + "loss": 0.5668, + "step": 20510 + }, + { + "epoch": 17.95, + "learning_rate": 0.00016755319148936167, + "loss": 0.5677, + "step": 20520 + }, + { + "epoch": 17.96, + "learning_rate": 0.00016748670212765954, + "loss": 0.5402, + "step": 20530 + }, + { + "epoch": 17.97, + "learning_rate": 0.0001674202127659574, + "loss": 0.6511, + "step": 20540 + }, + { + "epoch": 17.98, + "learning_rate": 0.0001673537234042553, + "loss": 0.499, + "step": 20550 + }, + { + "epoch": 17.99, + "learning_rate": 0.00016728723404255317, + "loss": 0.5473, + "step": 20560 + }, + { + "epoch": 18.0, + "learning_rate": 0.00016722074468085104, + "loss": 0.5949, + "step": 20570 + }, + { + "epoch": 18.01, + "learning_rate": 0.0001671542553191489, + "loss": 0.5791, + "step": 20580 + }, + { + "epoch": 18.01, + "learning_rate": 0.00016708776595744678, + "loss": 0.5072, + "step": 20590 + }, + { + "epoch": 18.02, + "learning_rate": 0.00016702127659574465, + "loss": 0.458, + "step": 20600 + }, + { + "epoch": 18.03, + "learning_rate": 0.00016695478723404252, + "loss": 0.6587, + "step": 20610 + }, + { + "epoch": 18.04, + "learning_rate": 0.0001668882978723404, + "loss": 0.4883, + "step": 20620 + }, + { + "epoch": 18.05, + "learning_rate": 0.0001668218085106383, + "loss": 0.5607, + "step": 20630 + }, + { + "epoch": 18.06, + "learning_rate": 0.00016675531914893616, + "loss": 0.4844, + "step": 20640 + }, + { + "epoch": 18.07, + "learning_rate": 0.00016668882978723403, + "loss": 0.3625, + "step": 20650 + }, + { + "epoch": 18.08, + "learning_rate": 0.0001666223404255319, + "loss": 0.594, + "step": 20660 + }, + { + "epoch": 18.08, + "learning_rate": 0.00016655585106382977, + "loss": 0.5494, + "step": 20670 + }, + { + "epoch": 18.09, + "learning_rate": 0.00016648936170212764, + "loss": 0.6277, + "step": 20680 + }, + { + "epoch": 18.1, + "learning_rate": 0.0001664228723404255, + "loss": 0.5218, + "step": 20690 + }, + { + "epoch": 18.11, + "learning_rate": 0.00016635638297872338, + "loss": 0.4139, + "step": 20700 + }, + { + "epoch": 18.12, + "learning_rate": 0.00016628989361702128, + "loss": 0.6951, + "step": 20710 + }, + { + "epoch": 18.13, + "learning_rate": 0.00016622340425531914, + "loss": 0.4451, + "step": 20720 + }, + { + "epoch": 18.14, + "learning_rate": 0.00016615691489361701, + "loss": 0.5954, + "step": 20730 + }, + { + "epoch": 18.15, + "learning_rate": 0.00016609042553191488, + "loss": 0.489, + "step": 20740 + }, + { + "epoch": 18.15, + "learning_rate": 0.00016602393617021275, + "loss": 0.4223, + "step": 20750 + }, + { + "epoch": 18.16, + "learning_rate": 0.00016595744680851062, + "loss": 0.6112, + "step": 20760 + }, + { + "epoch": 18.17, + "learning_rate": 0.0001658909574468085, + "loss": 0.5304, + "step": 20770 + }, + { + "epoch": 18.18, + "learning_rate": 0.00016582446808510636, + "loss": 0.5065, + "step": 20780 + }, + { + "epoch": 18.19, + "learning_rate": 0.00016575797872340426, + "loss": 0.4905, + "step": 20790 + }, + { + "epoch": 18.2, + "learning_rate": 0.00016569148936170213, + "loss": 0.5118, + "step": 20800 + }, + { + "epoch": 18.21, + "learning_rate": 0.000165625, + "loss": 0.659, + "step": 20810 + }, + { + "epoch": 18.22, + "learning_rate": 0.00016555851063829787, + "loss": 0.4521, + "step": 20820 + }, + { + "epoch": 18.22, + "learning_rate": 0.00016549202127659574, + "loss": 0.4849, + "step": 20830 + }, + { + "epoch": 18.23, + "learning_rate": 0.0001654255319148936, + "loss": 0.4451, + "step": 20840 + }, + { + "epoch": 18.24, + "learning_rate": 0.00016535904255319148, + "loss": 0.4317, + "step": 20850 + }, + { + "epoch": 18.25, + "learning_rate": 0.00016529255319148935, + "loss": 0.6025, + "step": 20860 + }, + { + "epoch": 18.26, + "learning_rate": 0.0001652260638297872, + "loss": 0.4809, + "step": 20870 + }, + { + "epoch": 18.27, + "learning_rate": 0.0001651595744680851, + "loss": 0.5499, + "step": 20880 + }, + { + "epoch": 18.28, + "learning_rate": 0.00016509308510638296, + "loss": 0.5277, + "step": 20890 + }, + { + "epoch": 18.29, + "learning_rate": 0.00016502659574468083, + "loss": 0.4754, + "step": 20900 + }, + { + "epoch": 18.29, + "learning_rate": 0.0001649601063829787, + "loss": 0.6204, + "step": 20910 + }, + { + "epoch": 18.3, + "learning_rate": 0.00016489361702127657, + "loss": 0.5341, + "step": 20920 + }, + { + "epoch": 18.31, + "learning_rate": 0.00016482712765957444, + "loss": 0.572, + "step": 20930 + }, + { + "epoch": 18.32, + "learning_rate": 0.0001647606382978723, + "loss": 0.5581, + "step": 20940 + }, + { + "epoch": 18.33, + "learning_rate": 0.00016469414893617018, + "loss": 0.5132, + "step": 20950 + }, + { + "epoch": 18.34, + "learning_rate": 0.00016462765957446808, + "loss": 0.6132, + "step": 20960 + }, + { + "epoch": 18.35, + "learning_rate": 0.00016456117021276595, + "loss": 0.4311, + "step": 20970 + }, + { + "epoch": 18.36, + "learning_rate": 0.00016449468085106382, + "loss": 0.5897, + "step": 20980 + }, + { + "epoch": 18.36, + "learning_rate": 0.00016442819148936169, + "loss": 0.52, + "step": 20990 + }, + { + "epoch": 18.37, + "learning_rate": 0.00016436170212765956, + "loss": 0.5028, + "step": 21000 + }, + { + "epoch": 18.37, + "eval_cer1": 0.29526349549306236, + "eval_cer2": 0.26733388022969645, + "eval_cer3": 0.2455733420450833, + "eval_cer4": 0.24488876010174185, + "eval_cer5": 0.2694692144373673, + "eval_loss": 1.0593605041503906, + "eval_runtime": 1289.2115, + "eval_samples_per_second": 6.795, + "step": 21000 + }, + { + "epoch": 18.38, + "learning_rate": 0.00016429521276595743, + "loss": 0.5897, + "step": 21010 + }, + { + "epoch": 18.39, + "learning_rate": 0.0001642287234042553, + "loss": 0.3999, + "step": 21020 + }, + { + "epoch": 18.4, + "learning_rate": 0.00016416223404255316, + "loss": 0.5383, + "step": 21030 + }, + { + "epoch": 18.41, + "learning_rate": 0.00016409574468085106, + "loss": 0.6265, + "step": 21040 + }, + { + "epoch": 18.42, + "learning_rate": 0.00016402925531914893, + "loss": 0.4316, + "step": 21050 + }, + { + "epoch": 18.43, + "learning_rate": 0.0001639627659574468, + "loss": 0.5767, + "step": 21060 + }, + { + "epoch": 18.43, + "learning_rate": 0.00016389627659574467, + "loss": 0.4826, + "step": 21070 + }, + { + "epoch": 18.44, + "learning_rate": 0.00016382978723404254, + "loss": 0.4948, + "step": 21080 + }, + { + "epoch": 18.45, + "learning_rate": 0.0001637632978723404, + "loss": 0.5146, + "step": 21090 + }, + { + "epoch": 18.46, + "learning_rate": 0.00016369680851063828, + "loss": 0.4797, + "step": 21100 + }, + { + "epoch": 18.47, + "learning_rate": 0.00016363031914893615, + "loss": 0.5347, + "step": 21110 + }, + { + "epoch": 18.48, + "learning_rate": 0.00016356382978723405, + "loss": 0.4746, + "step": 21120 + }, + { + "epoch": 18.49, + "learning_rate": 0.00016349734042553192, + "loss": 0.5058, + "step": 21130 + }, + { + "epoch": 18.49, + "learning_rate": 0.0001634308510638298, + "loss": 0.5457, + "step": 21140 + }, + { + "epoch": 18.5, + "learning_rate": 0.00016336436170212766, + "loss": 0.4463, + "step": 21150 + }, + { + "epoch": 18.51, + "learning_rate": 0.00016329787234042553, + "loss": 0.6715, + "step": 21160 + }, + { + "epoch": 18.52, + "learning_rate": 0.0001632313829787234, + "loss": 0.4169, + "step": 21170 + }, + { + "epoch": 18.53, + "learning_rate": 0.00016316489361702127, + "loss": 0.6026, + "step": 21180 + }, + { + "epoch": 18.54, + "learning_rate": 0.00016309840425531914, + "loss": 0.5468, + "step": 21190 + }, + { + "epoch": 18.55, + "learning_rate": 0.00016303191489361703, + "loss": 0.4206, + "step": 21200 + }, + { + "epoch": 18.56, + "learning_rate": 0.0001629654255319149, + "loss": 0.6104, + "step": 21210 + }, + { + "epoch": 18.56, + "learning_rate": 0.00016289893617021277, + "loss": 0.4292, + "step": 21220 + }, + { + "epoch": 18.57, + "learning_rate": 0.00016283244680851062, + "loss": 0.605, + "step": 21230 + }, + { + "epoch": 18.58, + "learning_rate": 0.00016276595744680849, + "loss": 0.4774, + "step": 21240 + }, + { + "epoch": 18.59, + "learning_rate": 0.00016269946808510636, + "loss": 0.506, + "step": 21250 + }, + { + "epoch": 18.6, + "learning_rate": 0.00016263297872340423, + "loss": 0.6354, + "step": 21260 + }, + { + "epoch": 18.61, + "learning_rate": 0.0001625664893617021, + "loss": 0.4327, + "step": 21270 + }, + { + "epoch": 18.62, + "learning_rate": 0.00016249999999999997, + "loss": 0.6283, + "step": 21280 + }, + { + "epoch": 18.63, + "learning_rate": 0.00016243351063829784, + "loss": 0.5527, + "step": 21290 + }, + { + "epoch": 18.63, + "learning_rate": 0.00016236702127659573, + "loss": 0.3719, + "step": 21300 + }, + { + "epoch": 18.64, + "learning_rate": 0.0001623005319148936, + "loss": 0.5809, + "step": 21310 + }, + { + "epoch": 18.65, + "learning_rate": 0.00016223404255319147, + "loss": 0.4923, + "step": 21320 + }, + { + "epoch": 18.66, + "learning_rate": 0.00016216755319148934, + "loss": 0.5081, + "step": 21330 + }, + { + "epoch": 18.67, + "learning_rate": 0.0001621010638297872, + "loss": 0.5454, + "step": 21340 + }, + { + "epoch": 18.68, + "learning_rate": 0.00016203457446808508, + "loss": 0.3996, + "step": 21350 + }, + { + "epoch": 18.69, + "learning_rate": 0.00016196808510638295, + "loss": 0.606, + "step": 21360 + }, + { + "epoch": 18.7, + "learning_rate": 0.00016190159574468082, + "loss": 0.4586, + "step": 21370 + }, + { + "epoch": 18.7, + "learning_rate": 0.00016183510638297872, + "loss": 0.6339, + "step": 21380 + }, + { + "epoch": 18.71, + "learning_rate": 0.0001617686170212766, + "loss": 0.4783, + "step": 21390 + }, + { + "epoch": 18.72, + "learning_rate": 0.00016170212765957446, + "loss": 0.451, + "step": 21400 + }, + { + "epoch": 18.73, + "learning_rate": 0.00016163563829787233, + "loss": 0.5994, + "step": 21410 + }, + { + "epoch": 18.74, + "learning_rate": 0.0001615691489361702, + "loss": 0.3993, + "step": 21420 + }, + { + "epoch": 18.75, + "learning_rate": 0.00016150265957446807, + "loss": 0.5211, + "step": 21430 + }, + { + "epoch": 18.76, + "learning_rate": 0.00016143617021276594, + "loss": 0.5571, + "step": 21440 + }, + { + "epoch": 18.77, + "learning_rate": 0.0001613696808510638, + "loss": 0.4245, + "step": 21450 + }, + { + "epoch": 18.77, + "learning_rate": 0.0001613031914893617, + "loss": 0.6263, + "step": 21460 + }, + { + "epoch": 18.78, + "learning_rate": 0.00016123670212765957, + "loss": 0.4876, + "step": 21470 + }, + { + "epoch": 18.79, + "learning_rate": 0.00016117021276595744, + "loss": 0.5689, + "step": 21480 + }, + { + "epoch": 18.8, + "learning_rate": 0.00016110372340425531, + "loss": 0.5488, + "step": 21490 + }, + { + "epoch": 18.81, + "learning_rate": 0.00016103723404255318, + "loss": 0.4915, + "step": 21500 + }, + { + "epoch": 18.82, + "learning_rate": 0.00016097074468085105, + "loss": 0.5903, + "step": 21510 + }, + { + "epoch": 18.83, + "learning_rate": 0.00016090425531914892, + "loss": 0.4799, + "step": 21520 + }, + { + "epoch": 18.84, + "learning_rate": 0.00016083776595744682, + "loss": 0.5862, + "step": 21530 + }, + { + "epoch": 18.84, + "learning_rate": 0.0001607712765957447, + "loss": 0.5923, + "step": 21540 + }, + { + "epoch": 18.85, + "learning_rate": 0.00016070478723404256, + "loss": 0.5033, + "step": 21550 + }, + { + "epoch": 18.86, + "learning_rate": 0.00016063829787234043, + "loss": 0.6566, + "step": 21560 + }, + { + "epoch": 18.87, + "learning_rate": 0.0001605718085106383, + "loss": 0.4458, + "step": 21570 + }, + { + "epoch": 18.88, + "learning_rate": 0.00016050531914893614, + "loss": 0.644, + "step": 21580 + }, + { + "epoch": 18.89, + "learning_rate": 0.000160438829787234, + "loss": 0.5241, + "step": 21590 + }, + { + "epoch": 18.9, + "learning_rate": 0.00016037234042553188, + "loss": 0.42, + "step": 21600 + }, + { + "epoch": 18.9, + "eval_cer1": 0.2872624151784207, + "eval_cer2": 0.26392124692370794, + "eval_cer3": 0.23871283894152237, + "eval_cer4": 0.23935091277890466, + "eval_cer5": 0.2645435244161359, + "eval_loss": 1.0357513427734375, + "eval_runtime": 1285.6703, + "eval_samples_per_second": 6.814, + "step": 21600 + }, + { + "epoch": 18.91, + "learning_rate": 0.00016030585106382975, + "loss": 0.6998, + "step": 21610 + }, + { + "epoch": 18.91, + "learning_rate": 0.00016023936170212762, + "loss": 0.4521, + "step": 21620 + }, + { + "epoch": 18.92, + "learning_rate": 0.00016017287234042552, + "loss": 0.591, + "step": 21630 + }, + { + "epoch": 18.93, + "learning_rate": 0.0001601063829787234, + "loss": 0.5062, + "step": 21640 + }, + { + "epoch": 18.94, + "learning_rate": 0.00016003989361702126, + "loss": 0.4117, + "step": 21650 + }, + { + "epoch": 18.95, + "learning_rate": 0.00015997340425531913, + "loss": 0.596, + "step": 21660 + }, + { + "epoch": 18.96, + "learning_rate": 0.000159906914893617, + "loss": 0.5639, + "step": 21670 + }, + { + "epoch": 18.97, + "learning_rate": 0.00015984042553191487, + "loss": 0.5082, + "step": 21680 + }, + { + "epoch": 18.98, + "learning_rate": 0.00015977393617021274, + "loss": 0.493, + "step": 21690 + }, + { + "epoch": 18.98, + "learning_rate": 0.0001597074468085106, + "loss": 0.4676, + "step": 21700 + }, + { + "epoch": 18.99, + "learning_rate": 0.0001596409574468085, + "loss": 0.5781, + "step": 21710 + }, + { + "epoch": 19.0, + "learning_rate": 0.00015957446808510637, + "loss": 0.5025, + "step": 21720 + }, + { + "epoch": 19.01, + "learning_rate": 0.00015950797872340424, + "loss": 0.4536, + "step": 21730 + }, + { + "epoch": 19.02, + "learning_rate": 0.00015944148936170211, + "loss": 0.2944, + "step": 21740 + }, + { + "epoch": 19.03, + "learning_rate": 0.00015937499999999998, + "loss": 0.5119, + "step": 21750 + }, + { + "epoch": 19.04, + "learning_rate": 0.00015930851063829785, + "loss": 0.515, + "step": 21760 + }, + { + "epoch": 19.05, + "learning_rate": 0.00015924202127659572, + "loss": 0.4115, + "step": 21770 + }, + { + "epoch": 19.06, + "learning_rate": 0.0001591755319148936, + "loss": 0.4773, + "step": 21780 + }, + { + "epoch": 19.06, + "learning_rate": 0.0001591090425531915, + "loss": 0.4156, + "step": 21790 + }, + { + "epoch": 19.07, + "learning_rate": 0.00015904255319148936, + "loss": 0.5364, + "step": 21800 + }, + { + "epoch": 19.08, + "learning_rate": 0.00015897606382978723, + "loss": 0.488, + "step": 21810 + }, + { + "epoch": 19.09, + "learning_rate": 0.0001589095744680851, + "loss": 0.4208, + "step": 21820 + }, + { + "epoch": 19.1, + "learning_rate": 0.00015884308510638297, + "loss": 0.536, + "step": 21830 + }, + { + "epoch": 19.11, + "learning_rate": 0.00015877659574468084, + "loss": 0.3673, + "step": 21840 + }, + { + "epoch": 19.12, + "learning_rate": 0.0001587101063829787, + "loss": 0.5251, + "step": 21850 + }, + { + "epoch": 19.13, + "learning_rate": 0.00015864361702127658, + "loss": 0.4637, + "step": 21860 + }, + { + "epoch": 19.13, + "learning_rate": 0.00015857712765957448, + "loss": 0.4394, + "step": 21870 + }, + { + "epoch": 19.14, + "learning_rate": 0.00015851063829787235, + "loss": 0.5169, + "step": 21880 + }, + { + "epoch": 19.15, + "learning_rate": 0.00015844414893617022, + "loss": 0.3745, + "step": 21890 + }, + { + "epoch": 19.16, + "learning_rate": 0.00015837765957446809, + "loss": 0.5548, + "step": 21900 + }, + { + "epoch": 19.17, + "learning_rate": 0.00015831117021276596, + "loss": 0.4346, + "step": 21910 + }, + { + "epoch": 19.18, + "learning_rate": 0.00015824468085106383, + "loss": 0.4351, + "step": 21920 + }, + { + "epoch": 19.19, + "learning_rate": 0.00015817819148936167, + "loss": 0.5054, + "step": 21930 + }, + { + "epoch": 19.2, + "learning_rate": 0.00015811170212765954, + "loss": 0.4015, + "step": 21940 + }, + { + "epoch": 19.2, + "learning_rate": 0.0001580452127659574, + "loss": 0.5445, + "step": 21950 + }, + { + "epoch": 19.21, + "learning_rate": 0.00015797872340425528, + "loss": 0.4356, + "step": 21960 + }, + { + "epoch": 19.22, + "learning_rate": 0.00015791223404255318, + "loss": 0.4026, + "step": 21970 + }, + { + "epoch": 19.23, + "learning_rate": 0.00015784574468085105, + "loss": 0.4748, + "step": 21980 + }, + { + "epoch": 19.24, + "learning_rate": 0.00015777925531914892, + "loss": 0.3956, + "step": 21990 + }, + { + "epoch": 19.25, + "learning_rate": 0.00015771276595744679, + "loss": 0.5343, + "step": 22000 + }, + { + "epoch": 19.26, + "learning_rate": 0.00015764627659574465, + "loss": 0.4948, + "step": 22010 + }, + { + "epoch": 19.26, + "learning_rate": 0.00015757978723404252, + "loss": 0.4326, + "step": 22020 + }, + { + "epoch": 19.27, + "learning_rate": 0.0001575132978723404, + "loss": 0.4713, + "step": 22030 + }, + { + "epoch": 19.28, + "learning_rate": 0.0001574468085106383, + "loss": 0.4455, + "step": 22040 + }, + { + "epoch": 19.29, + "learning_rate": 0.00015738031914893616, + "loss": 0.554, + "step": 22050 + }, + { + "epoch": 19.3, + "learning_rate": 0.00015731382978723403, + "loss": 0.4462, + "step": 22060 + }, + { + "epoch": 19.31, + "learning_rate": 0.0001572473404255319, + "loss": 0.4602, + "step": 22070 + }, + { + "epoch": 19.32, + "learning_rate": 0.00015718085106382977, + "loss": 0.5636, + "step": 22080 + }, + { + "epoch": 19.33, + "learning_rate": 0.00015711436170212764, + "loss": 0.4309, + "step": 22090 + }, + { + "epoch": 19.33, + "learning_rate": 0.0001570478723404255, + "loss": 0.5513, + "step": 22100 + }, + { + "epoch": 19.34, + "learning_rate": 0.00015698138297872338, + "loss": 0.4773, + "step": 22110 + }, + { + "epoch": 19.35, + "learning_rate": 0.00015691489361702128, + "loss": 0.4786, + "step": 22120 + }, + { + "epoch": 19.36, + "learning_rate": 0.00015684840425531915, + "loss": 0.5069, + "step": 22130 + }, + { + "epoch": 19.37, + "learning_rate": 0.00015678191489361702, + "loss": 0.3374, + "step": 22140 + }, + { + "epoch": 19.38, + "learning_rate": 0.0001567154255319149, + "loss": 0.5003, + "step": 22150 + }, + { + "epoch": 19.39, + "learning_rate": 0.00015664893617021276, + "loss": 0.4456, + "step": 22160 + }, + { + "epoch": 19.4, + "learning_rate": 0.00015658244680851063, + "loss": 0.3916, + "step": 22170 + }, + { + "epoch": 19.4, + "learning_rate": 0.0001565159574468085, + "loss": 0.5528, + "step": 22180 + }, + { + "epoch": 19.41, + "learning_rate": 0.00015644946808510637, + "loss": 0.3493, + "step": 22190 + }, + { + "epoch": 19.42, + "learning_rate": 0.00015638297872340426, + "loss": 0.5736, + "step": 22200 + }, + { + "epoch": 19.42, + "eval_cer1": 0.28699233651801087, + "eval_cer2": 0.2619196062346185, + "eval_cer3": 0.23681803332244364, + "eval_cer4": 0.24022022602144305, + "eval_cer5": 0.267515923566879, + "eval_loss": 1.0466623306274414, + "eval_runtime": 1302.8872, + "eval_samples_per_second": 6.724, + "step": 22200 + }, + { + "epoch": 19.43, + "learning_rate": 0.00015631648936170213, + "loss": 0.4342, + "step": 22210 + }, + { + "epoch": 19.44, + "learning_rate": 0.00015625, + "loss": 0.4106, + "step": 22220 + }, + { + "epoch": 19.45, + "learning_rate": 0.00015618351063829787, + "loss": 0.5392, + "step": 22230 + }, + { + "epoch": 19.46, + "learning_rate": 0.00015611702127659574, + "loss": 0.3515, + "step": 22240 + }, + { + "epoch": 19.47, + "learning_rate": 0.0001560505319148936, + "loss": 0.6013, + "step": 22250 + }, + { + "epoch": 19.47, + "learning_rate": 0.00015598404255319148, + "loss": 0.5146, + "step": 22260 + }, + { + "epoch": 19.48, + "learning_rate": 0.00015591755319148935, + "loss": 0.4502, + "step": 22270 + }, + { + "epoch": 19.49, + "learning_rate": 0.0001558510638297872, + "loss": 0.5387, + "step": 22280 + }, + { + "epoch": 19.5, + "learning_rate": 0.00015578457446808507, + "loss": 0.3682, + "step": 22290 + }, + { + "epoch": 19.51, + "learning_rate": 0.00015571808510638296, + "loss": 0.5577, + "step": 22300 + }, + { + "epoch": 19.52, + "learning_rate": 0.00015565159574468083, + "loss": 0.3955, + "step": 22310 + }, + { + "epoch": 19.53, + "learning_rate": 0.0001555851063829787, + "loss": 0.4984, + "step": 22320 + }, + { + "epoch": 19.54, + "learning_rate": 0.00015551861702127657, + "loss": 0.5044, + "step": 22330 + }, + { + "epoch": 19.54, + "learning_rate": 0.00015545212765957444, + "loss": 0.3285, + "step": 22340 + }, + { + "epoch": 19.55, + "learning_rate": 0.0001553856382978723, + "loss": 0.5716, + "step": 22350 + }, + { + "epoch": 19.56, + "learning_rate": 0.00015531914893617018, + "loss": 0.4688, + "step": 22360 + }, + { + "epoch": 19.57, + "learning_rate": 0.00015525265957446805, + "loss": 0.4502, + "step": 22370 + }, + { + "epoch": 19.58, + "learning_rate": 0.00015518617021276595, + "loss": 0.5576, + "step": 22380 + }, + { + "epoch": 19.59, + "learning_rate": 0.00015511968085106382, + "loss": 0.3756, + "step": 22390 + }, + { + "epoch": 19.6, + "learning_rate": 0.0001550531914893617, + "loss": 0.5045, + "step": 22400 + }, + { + "epoch": 19.61, + "learning_rate": 0.00015498670212765956, + "loss": 0.474, + "step": 22410 + }, + { + "epoch": 19.61, + "learning_rate": 0.00015492021276595743, + "loss": 0.3889, + "step": 22420 + }, + { + "epoch": 19.62, + "learning_rate": 0.0001548537234042553, + "loss": 0.5142, + "step": 22430 + }, + { + "epoch": 19.63, + "learning_rate": 0.00015478723404255317, + "loss": 0.4911, + "step": 22440 + }, + { + "epoch": 19.64, + "learning_rate": 0.00015472074468085104, + "loss": 0.5799, + "step": 22450 + }, + { + "epoch": 19.65, + "learning_rate": 0.00015465425531914893, + "loss": 0.4783, + "step": 22460 + }, + { + "epoch": 19.66, + "learning_rate": 0.0001545877659574468, + "loss": 0.4639, + "step": 22470 + }, + { + "epoch": 19.67, + "learning_rate": 0.00015452127659574467, + "loss": 0.5209, + "step": 22480 + }, + { + "epoch": 19.68, + "learning_rate": 0.00015445478723404254, + "loss": 0.411, + "step": 22490 + }, + { + "epoch": 19.68, + "learning_rate": 0.0001543882978723404, + "loss": 0.553, + "step": 22500 + }, + { + "epoch": 19.69, + "learning_rate": 0.00015432180851063828, + "loss": 0.4449, + "step": 22510 + }, + { + "epoch": 19.7, + "learning_rate": 0.00015425531914893615, + "loss": 0.4784, + "step": 22520 + }, + { + "epoch": 19.71, + "learning_rate": 0.00015418882978723402, + "loss": 0.4938, + "step": 22530 + }, + { + "epoch": 19.72, + "learning_rate": 0.00015412234042553192, + "loss": 0.3715, + "step": 22540 + }, + { + "epoch": 19.73, + "learning_rate": 0.0001540558510638298, + "loss": 0.6178, + "step": 22550 + }, + { + "epoch": 19.74, + "learning_rate": 0.00015398936170212766, + "loss": 0.4751, + "step": 22560 + }, + { + "epoch": 19.75, + "learning_rate": 0.00015392287234042553, + "loss": 0.4297, + "step": 22570 + }, + { + "epoch": 19.75, + "learning_rate": 0.0001538563829787234, + "loss": 0.5751, + "step": 22580 + }, + { + "epoch": 19.76, + "learning_rate": 0.00015378989361702127, + "loss": 0.3924, + "step": 22590 + }, + { + "epoch": 19.77, + "learning_rate": 0.00015372340425531914, + "loss": 0.5138, + "step": 22600 + }, + { + "epoch": 19.78, + "learning_rate": 0.000153656914893617, + "loss": 0.4222, + "step": 22610 + }, + { + "epoch": 19.79, + "learning_rate": 0.0001535904255319149, + "loss": 0.4328, + "step": 22620 + }, + { + "epoch": 19.8, + "learning_rate": 0.00015352393617021278, + "loss": 0.5116, + "step": 22630 + }, + { + "epoch": 19.81, + "learning_rate": 0.00015345744680851062, + "loss": 0.4284, + "step": 22640 + }, + { + "epoch": 19.82, + "learning_rate": 0.0001533909574468085, + "loss": 0.6658, + "step": 22650 + }, + { + "epoch": 19.82, + "learning_rate": 0.00015332446808510636, + "loss": 0.5538, + "step": 22660 + }, + { + "epoch": 19.83, + "learning_rate": 0.00015325797872340423, + "loss": 0.5506, + "step": 22670 + }, + { + "epoch": 19.84, + "learning_rate": 0.0001531914893617021, + "loss": 0.5281, + "step": 22680 + }, + { + "epoch": 19.85, + "learning_rate": 0.00015312499999999997, + "loss": 0.3618, + "step": 22690 + }, + { + "epoch": 19.86, + "learning_rate": 0.00015305851063829784, + "loss": 0.5728, + "step": 22700 + }, + { + "epoch": 19.87, + "learning_rate": 0.00015299202127659573, + "loss": 0.4494, + "step": 22710 + }, + { + "epoch": 19.88, + "learning_rate": 0.0001529255319148936, + "loss": 0.4703, + "step": 22720 + }, + { + "epoch": 19.89, + "learning_rate": 0.00015285904255319147, + "loss": 0.4973, + "step": 22730 + }, + { + "epoch": 19.89, + "learning_rate": 0.00015279255319148934, + "loss": 0.4946, + "step": 22740 + }, + { + "epoch": 19.9, + "learning_rate": 0.00015272606382978721, + "loss": 0.5715, + "step": 22750 + }, + { + "epoch": 19.91, + "learning_rate": 0.00015265957446808508, + "loss": 0.4535, + "step": 22760 + }, + { + "epoch": 19.92, + "learning_rate": 0.00015259308510638295, + "loss": 0.4902, + "step": 22770 + }, + { + "epoch": 19.93, + "learning_rate": 0.00015252659574468082, + "loss": 0.5148, + "step": 22780 + }, + { + "epoch": 19.94, + "learning_rate": 0.00015246010638297872, + "loss": 0.469, + "step": 22790 + }, + { + "epoch": 19.95, + "learning_rate": 0.0001523936170212766, + "loss": 0.5532, + "step": 22800 + }, + { + "epoch": 19.95, + "eval_cer1": 0.28699233651801087, + "eval_cer2": 0.2643150123051682, + "eval_cer3": 0.24041163018621364, + "eval_cer4": 0.24141150713158827, + "eval_cer5": 0.2669214437367304, + "eval_loss": 1.0525282621383667, + "eval_runtime": 1312.9229, + "eval_samples_per_second": 6.672, + "step": 22800 + }, + { + "epoch": 19.96, + "learning_rate": 0.00015232712765957446, + "loss": 0.4585, + "step": 22810 + }, + { + "epoch": 19.96, + "learning_rate": 0.00015226063829787233, + "loss": 0.4733, + "step": 22820 + }, + { + "epoch": 19.97, + "learning_rate": 0.0001521941489361702, + "loss": 0.5658, + "step": 22830 + }, + { + "epoch": 19.98, + "learning_rate": 0.00015212765957446807, + "loss": 0.3982, + "step": 22840 + }, + { + "epoch": 19.99, + "learning_rate": 0.00015206117021276594, + "loss": 0.5479, + "step": 22850 + }, + { + "epoch": 20.0, + "learning_rate": 0.0001519946808510638, + "loss": 0.3584, + "step": 22860 + }, + { + "epoch": 20.01, + "learning_rate": 0.0001519281914893617, + "loss": 0.6497, + "step": 22870 + }, + { + "epoch": 20.02, + "learning_rate": 0.00015186170212765958, + "loss": 0.351, + "step": 22880 + }, + { + "epoch": 20.03, + "learning_rate": 0.00015179521276595745, + "loss": 0.4643, + "step": 22890 + }, + { + "epoch": 20.03, + "learning_rate": 0.00015172872340425532, + "loss": 0.4563, + "step": 22900 + }, + { + "epoch": 20.04, + "learning_rate": 0.00015166223404255319, + "loss": 0.3648, + "step": 22910 + }, + { + "epoch": 20.05, + "learning_rate": 0.00015159574468085106, + "loss": 0.549, + "step": 22920 + }, + { + "epoch": 20.06, + "learning_rate": 0.00015152925531914893, + "loss": 0.3499, + "step": 22930 + }, + { + "epoch": 20.07, + "learning_rate": 0.0001514627659574468, + "loss": 0.4264, + "step": 22940 + }, + { + "epoch": 20.08, + "learning_rate": 0.0001513962765957447, + "loss": 0.4634, + "step": 22950 + }, + { + "epoch": 20.09, + "learning_rate": 0.00015132978723404256, + "loss": 0.3053, + "step": 22960 + }, + { + "epoch": 20.1, + "learning_rate": 0.00015126329787234043, + "loss": 0.5776, + "step": 22970 + }, + { + "epoch": 20.1, + "learning_rate": 0.0001511968085106383, + "loss": 0.3879, + "step": 22980 + }, + { + "epoch": 20.11, + "learning_rate": 0.00015113031914893615, + "loss": 0.4074, + "step": 22990 + }, + { + "epoch": 20.12, + "learning_rate": 0.00015106382978723401, + "loss": 0.4447, + "step": 23000 + }, + { + "epoch": 20.13, + "learning_rate": 0.00015099734042553188, + "loss": 0.3202, + "step": 23010 + }, + { + "epoch": 20.14, + "learning_rate": 0.00015093085106382975, + "loss": 0.5024, + "step": 23020 + }, + { + "epoch": 20.15, + "learning_rate": 0.00015086436170212762, + "loss": 0.351, + "step": 23030 + }, + { + "epoch": 20.16, + "learning_rate": 0.0001507978723404255, + "loss": 0.4579, + "step": 23040 + }, + { + "epoch": 20.17, + "learning_rate": 0.0001507313829787234, + "loss": 0.5248, + "step": 23050 + }, + { + "epoch": 20.17, + "learning_rate": 0.00015066489361702126, + "loss": 0.351, + "step": 23060 + }, + { + "epoch": 20.18, + "learning_rate": 0.00015059840425531913, + "loss": 0.5476, + "step": 23070 + }, + { + "epoch": 20.19, + "learning_rate": 0.000150531914893617, + "loss": 0.4098, + "step": 23080 + }, + { + "epoch": 20.2, + "learning_rate": 0.00015046542553191487, + "loss": 0.4718, + "step": 23090 + }, + { + "epoch": 20.21, + "learning_rate": 0.00015039893617021274, + "loss": 0.5629, + "step": 23100 + }, + { + "epoch": 20.22, + "learning_rate": 0.0001503324468085106, + "loss": 0.3173, + "step": 23110 + }, + { + "epoch": 20.23, + "learning_rate": 0.00015026595744680848, + "loss": 0.4894, + "step": 23120 + }, + { + "epoch": 20.24, + "learning_rate": 0.00015019946808510638, + "loss": 0.3124, + "step": 23130 + }, + { + "epoch": 20.24, + "learning_rate": 0.00015013297872340425, + "loss": 0.4747, + "step": 23140 + }, + { + "epoch": 20.25, + "learning_rate": 0.00015006648936170212, + "loss": 0.4302, + "step": 23150 + }, + { + "epoch": 20.26, + "learning_rate": 0.00015, + "loss": 0.334, + "step": 23160 + }, + { + "epoch": 20.27, + "learning_rate": 0.00014993351063829786, + "loss": 0.5744, + "step": 23170 + }, + { + "epoch": 20.28, + "learning_rate": 0.00014986702127659573, + "loss": 0.3977, + "step": 23180 + }, + { + "epoch": 20.29, + "learning_rate": 0.0001498005319148936, + "loss": 0.4895, + "step": 23190 + }, + { + "epoch": 20.3, + "learning_rate": 0.0001497340425531915, + "loss": 0.424, + "step": 23200 + }, + { + "epoch": 20.31, + "learning_rate": 0.00014966755319148936, + "loss": 0.2947, + "step": 23210 + }, + { + "epoch": 20.31, + "learning_rate": 0.00014960106382978723, + "loss": 0.5199, + "step": 23220 + }, + { + "epoch": 20.32, + "learning_rate": 0.0001495345744680851, + "loss": 0.3872, + "step": 23230 + }, + { + "epoch": 20.33, + "learning_rate": 0.00014946808510638297, + "loss": 0.4685, + "step": 23240 + }, + { + "epoch": 20.34, + "learning_rate": 0.00014940159574468084, + "loss": 0.4455, + "step": 23250 + }, + { + "epoch": 20.35, + "learning_rate": 0.0001493351063829787, + "loss": 0.3553, + "step": 23260 + }, + { + "epoch": 20.36, + "learning_rate": 0.00014926861702127658, + "loss": 0.5332, + "step": 23270 + }, + { + "epoch": 20.37, + "learning_rate": 0.00014920212765957445, + "loss": 0.381, + "step": 23280 + }, + { + "epoch": 20.38, + "learning_rate": 0.00014913563829787232, + "loss": 0.441, + "step": 23290 + }, + { + "epoch": 20.38, + "learning_rate": 0.0001490691489361702, + "loss": 0.4342, + "step": 23300 + }, + { + "epoch": 20.39, + "learning_rate": 0.00014900265957446806, + "loss": 0.3428, + "step": 23310 + }, + { + "epoch": 20.4, + "learning_rate": 0.00014893617021276593, + "loss": 0.5913, + "step": 23320 + }, + { + "epoch": 20.41, + "learning_rate": 0.00014886968085106383, + "loss": 0.5022, + "step": 23330 + }, + { + "epoch": 20.42, + "learning_rate": 0.0001488031914893617, + "loss": 0.4988, + "step": 23340 + }, + { + "epoch": 20.43, + "learning_rate": 0.00014873670212765957, + "loss": 0.4764, + "step": 23350 + }, + { + "epoch": 20.44, + "learning_rate": 0.00014867021276595744, + "loss": 0.2748, + "step": 23360 + }, + { + "epoch": 20.45, + "learning_rate": 0.0001486037234042553, + "loss": 0.5289, + "step": 23370 + }, + { + "epoch": 20.45, + "learning_rate": 0.00014853723404255318, + "loss": 0.3794, + "step": 23380 + }, + { + "epoch": 20.46, + "learning_rate": 0.00014847074468085105, + "loss": 0.416, + "step": 23390 + }, + { + "epoch": 20.47, + "learning_rate": 0.00014840425531914892, + "loss": 0.4617, + "step": 23400 + }, + { + "epoch": 20.47, + "eval_cer1": 0.2836163532628878, + "eval_cer2": 0.25899917965545527, + "eval_cer3": 0.23394315583142763, + "eval_cer4": 0.2339418526031102, + "eval_cer5": 0.25613588110403396, + "eval_loss": 1.036176323890686, + "eval_runtime": 1318.1208, + "eval_samples_per_second": 6.646, + "step": 23400 + }, + { + "epoch": 20.48, + "learning_rate": 0.00014833776595744681, + "loss": 0.337, + "step": 23410 + }, + { + "epoch": 20.49, + "learning_rate": 0.00014827127659574468, + "loss": 0.5062, + "step": 23420 + }, + { + "epoch": 20.5, + "learning_rate": 0.00014820478723404253, + "loss": 0.4902, + "step": 23430 + }, + { + "epoch": 20.51, + "learning_rate": 0.0001481382978723404, + "loss": 0.4485, + "step": 23440 + }, + { + "epoch": 20.52, + "learning_rate": 0.00014807180851063827, + "loss": 0.4609, + "step": 23450 + }, + { + "epoch": 20.52, + "learning_rate": 0.00014800531914893616, + "loss": 0.359, + "step": 23460 + }, + { + "epoch": 20.53, + "learning_rate": 0.00014793882978723403, + "loss": 0.5884, + "step": 23470 + }, + { + "epoch": 20.54, + "learning_rate": 0.0001478723404255319, + "loss": 0.4197, + "step": 23480 + }, + { + "epoch": 20.55, + "learning_rate": 0.00014780585106382977, + "loss": 0.4504, + "step": 23490 + }, + { + "epoch": 20.56, + "learning_rate": 0.00014773936170212764, + "loss": 0.4957, + "step": 23500 + }, + { + "epoch": 20.57, + "learning_rate": 0.0001476728723404255, + "loss": 0.3328, + "step": 23510 + }, + { + "epoch": 20.58, + "learning_rate": 0.00014760638297872338, + "loss": 0.5621, + "step": 23520 + }, + { + "epoch": 20.59, + "learning_rate": 0.00014753989361702125, + "loss": 0.4464, + "step": 23530 + }, + { + "epoch": 20.59, + "learning_rate": 0.00014747340425531915, + "loss": 0.4985, + "step": 23540 + }, + { + "epoch": 20.6, + "learning_rate": 0.00014740691489361702, + "loss": 0.4642, + "step": 23550 + }, + { + "epoch": 20.61, + "learning_rate": 0.0001473404255319149, + "loss": 0.3448, + "step": 23560 + }, + { + "epoch": 20.62, + "learning_rate": 0.00014727393617021276, + "loss": 0.5492, + "step": 23570 + }, + { + "epoch": 20.63, + "learning_rate": 0.00014720744680851063, + "loss": 0.3898, + "step": 23580 + }, + { + "epoch": 20.64, + "learning_rate": 0.0001471409574468085, + "loss": 0.4735, + "step": 23590 + }, + { + "epoch": 20.65, + "learning_rate": 0.00014707446808510637, + "loss": 0.4084, + "step": 23600 + }, + { + "epoch": 20.66, + "learning_rate": 0.00014700797872340424, + "loss": 0.3114, + "step": 23610 + }, + { + "epoch": 20.66, + "learning_rate": 0.0001469414893617021, + "loss": 0.6112, + "step": 23620 + }, + { + "epoch": 20.67, + "learning_rate": 0.00014687499999999998, + "loss": 0.4127, + "step": 23630 + }, + { + "epoch": 20.68, + "learning_rate": 0.00014680851063829785, + "loss": 0.4579, + "step": 23640 + }, + { + "epoch": 20.69, + "learning_rate": 0.00014674202127659572, + "loss": 0.4352, + "step": 23650 + }, + { + "epoch": 20.7, + "learning_rate": 0.0001466755319148936, + "loss": 0.3069, + "step": 23660 + }, + { + "epoch": 20.71, + "learning_rate": 0.00014660904255319149, + "loss": 0.5741, + "step": 23670 + }, + { + "epoch": 20.72, + "learning_rate": 0.00014654255319148936, + "loss": 0.3921, + "step": 23680 + }, + { + "epoch": 20.73, + "learning_rate": 0.00014647606382978722, + "loss": 0.4841, + "step": 23690 + }, + { + "epoch": 20.73, + "learning_rate": 0.0001464095744680851, + "loss": 0.4196, + "step": 23700 + }, + { + "epoch": 20.74, + "learning_rate": 0.00014634308510638296, + "loss": 0.3968, + "step": 23710 + }, + { + "epoch": 20.75, + "learning_rate": 0.00014627659574468083, + "loss": 0.5564, + "step": 23720 + }, + { + "epoch": 20.76, + "learning_rate": 0.0001462101063829787, + "loss": 0.3825, + "step": 23730 + }, + { + "epoch": 20.77, + "learning_rate": 0.0001461436170212766, + "loss": 0.4738, + "step": 23740 + }, + { + "epoch": 20.78, + "learning_rate": 0.00014607712765957447, + "loss": 0.5435, + "step": 23750 + }, + { + "epoch": 20.79, + "learning_rate": 0.00014601063829787234, + "loss": 0.359, + "step": 23760 + }, + { + "epoch": 20.8, + "learning_rate": 0.0001459441489361702, + "loss": 0.5754, + "step": 23770 + }, + { + "epoch": 20.8, + "learning_rate": 0.00014587765957446805, + "loss": 0.4005, + "step": 23780 + }, + { + "epoch": 20.81, + "learning_rate": 0.00014581117021276595, + "loss": 0.5477, + "step": 23790 + }, + { + "epoch": 20.82, + "learning_rate": 0.00014574468085106382, + "loss": 0.4592, + "step": 23800 + }, + { + "epoch": 20.83, + "learning_rate": 0.0001456781914893617, + "loss": 0.3583, + "step": 23810 + }, + { + "epoch": 20.84, + "learning_rate": 0.00014561170212765956, + "loss": 0.5245, + "step": 23820 + }, + { + "epoch": 20.85, + "learning_rate": 0.00014554521276595743, + "loss": 0.3789, + "step": 23830 + }, + { + "epoch": 20.86, + "learning_rate": 0.0001454787234042553, + "loss": 0.4733, + "step": 23840 + }, + { + "epoch": 20.87, + "learning_rate": 0.00014541223404255317, + "loss": 0.4335, + "step": 23850 + }, + { + "epoch": 20.87, + "learning_rate": 0.00014534574468085104, + "loss": 0.3584, + "step": 23860 + }, + { + "epoch": 20.88, + "learning_rate": 0.00014527925531914894, + "loss": 0.5562, + "step": 23870 + }, + { + "epoch": 20.89, + "learning_rate": 0.0001452127659574468, + "loss": 0.3774, + "step": 23880 + }, + { + "epoch": 20.9, + "learning_rate": 0.00014514627659574468, + "loss": 0.477, + "step": 23890 + }, + { + "epoch": 20.91, + "learning_rate": 0.00014507978723404255, + "loss": 0.4925, + "step": 23900 + }, + { + "epoch": 20.92, + "learning_rate": 0.00014501329787234042, + "loss": 0.3446, + "step": 23910 + }, + { + "epoch": 20.93, + "learning_rate": 0.00014494680851063829, + "loss": 0.5452, + "step": 23920 + }, + { + "epoch": 20.94, + "learning_rate": 0.00014488031914893616, + "loss": 0.4138, + "step": 23930 + }, + { + "epoch": 20.94, + "learning_rate": 0.00014481382978723403, + "loss": 0.4809, + "step": 23940 + }, + { + "epoch": 20.95, + "learning_rate": 0.00014474734042553192, + "loss": 0.4158, + "step": 23950 + }, + { + "epoch": 20.96, + "learning_rate": 0.00014468085106382977, + "loss": 0.3165, + "step": 23960 + }, + { + "epoch": 20.97, + "learning_rate": 0.00014461436170212764, + "loss": 0.5763, + "step": 23970 + }, + { + "epoch": 20.98, + "learning_rate": 0.0001445478723404255, + "loss": 0.438, + "step": 23980 + }, + { + "epoch": 20.99, + "learning_rate": 0.00014448138297872337, + "loss": 0.4939, + "step": 23990 + }, + { + "epoch": 21.0, + "learning_rate": 0.00014441489361702127, + "loss": 0.4442, + "step": 24000 + }, + { + "epoch": 21.0, + "eval_cer1": 0.2774045440734614, + "eval_cer2": 0.25640689089417557, + "eval_cer3": 0.2305455733420451, + "eval_cer4": 0.2344891979780418, + "eval_cer5": 0.25154989384288745, + "eval_loss": 1.0287288427352905, + "eval_runtime": 1322.1816, + "eval_samples_per_second": 6.625, + "step": 24000 + }, + { + "epoch": 21.01, + "learning_rate": 0.00014434840425531914, + "loss": 0.5521, + "step": 24010 + }, + { + "epoch": 21.01, + "learning_rate": 0.000144281914893617, + "loss": 0.3416, + "step": 24020 + }, + { + "epoch": 21.02, + "learning_rate": 0.00014421542553191488, + "loss": 0.3814, + "step": 24030 + }, + { + "epoch": 21.03, + "learning_rate": 0.00014414893617021275, + "loss": 0.4344, + "step": 24040 + }, + { + "epoch": 21.04, + "learning_rate": 0.00014408244680851062, + "loss": 0.3121, + "step": 24050 + }, + { + "epoch": 21.05, + "learning_rate": 0.0001440159574468085, + "loss": 0.4895, + "step": 24060 + }, + { + "epoch": 21.06, + "learning_rate": 0.00014394946808510636, + "loss": 0.3439, + "step": 24070 + }, + { + "epoch": 21.07, + "learning_rate": 0.00014388297872340426, + "loss": 0.3263, + "step": 24080 + }, + { + "epoch": 21.08, + "learning_rate": 0.00014381648936170213, + "loss": 0.4485, + "step": 24090 + }, + { + "epoch": 21.08, + "learning_rate": 0.00014375, + "loss": 0.2931, + "step": 24100 + }, + { + "epoch": 21.09, + "learning_rate": 0.00014368351063829787, + "loss": 0.4693, + "step": 24110 + }, + { + "epoch": 21.1, + "learning_rate": 0.00014361702127659574, + "loss": 0.3455, + "step": 24120 + }, + { + "epoch": 21.11, + "learning_rate": 0.0001435505319148936, + "loss": 0.2965, + "step": 24130 + }, + { + "epoch": 21.12, + "learning_rate": 0.00014348404255319148, + "loss": 0.4289, + "step": 24140 + }, + { + "epoch": 21.13, + "learning_rate": 0.00014341755319148935, + "loss": 0.3659, + "step": 24150 + }, + { + "epoch": 21.14, + "learning_rate": 0.00014335106382978722, + "loss": 0.5026, + "step": 24160 + }, + { + "epoch": 21.15, + "learning_rate": 0.0001432845744680851, + "loss": 0.386, + "step": 24170 + }, + { + "epoch": 21.15, + "learning_rate": 0.00014321808510638296, + "loss": 0.3223, + "step": 24180 + }, + { + "epoch": 21.16, + "learning_rate": 0.00014315159574468083, + "loss": 0.4534, + "step": 24190 + }, + { + "epoch": 21.17, + "learning_rate": 0.0001430851063829787, + "loss": 0.3164, + "step": 24200 + }, + { + "epoch": 21.18, + "learning_rate": 0.0001430186170212766, + "loss": 0.4428, + "step": 24210 + }, + { + "epoch": 21.19, + "learning_rate": 0.00014295212765957446, + "loss": 0.357, + "step": 24220 + }, + { + "epoch": 21.2, + "learning_rate": 0.00014288563829787233, + "loss": 0.3794, + "step": 24230 + }, + { + "epoch": 21.21, + "learning_rate": 0.0001428191489361702, + "loss": 0.4765, + "step": 24240 + }, + { + "epoch": 21.22, + "learning_rate": 0.00014275265957446807, + "loss": 0.2988, + "step": 24250 + }, + { + "epoch": 21.22, + "learning_rate": 0.00014268617021276594, + "loss": 0.4884, + "step": 24260 + }, + { + "epoch": 21.23, + "learning_rate": 0.0001426196808510638, + "loss": 0.3604, + "step": 24270 + }, + { + "epoch": 21.24, + "learning_rate": 0.00014255319148936168, + "loss": 0.3667, + "step": 24280 + }, + { + "epoch": 21.25, + "learning_rate": 0.00014248670212765958, + "loss": 0.4544, + "step": 24290 + }, + { + "epoch": 21.26, + "learning_rate": 0.00014242021276595745, + "loss": 0.3478, + "step": 24300 + }, + { + "epoch": 21.27, + "learning_rate": 0.0001423537234042553, + "loss": 0.4604, + "step": 24310 + }, + { + "epoch": 21.28, + "learning_rate": 0.00014228723404255316, + "loss": 0.3385, + "step": 24320 + }, + { + "epoch": 21.29, + "learning_rate": 0.00014222074468085106, + "loss": 0.3948, + "step": 24330 + }, + { + "epoch": 21.29, + "learning_rate": 0.00014215425531914893, + "loss": 0.5452, + "step": 24340 + }, + { + "epoch": 21.3, + "learning_rate": 0.0001420877659574468, + "loss": 0.3078, + "step": 24350 + }, + { + "epoch": 21.31, + "learning_rate": 0.00014202127659574467, + "loss": 0.4571, + "step": 24360 + }, + { + "epoch": 21.32, + "learning_rate": 0.00014195478723404254, + "loss": 0.297, + "step": 24370 + }, + { + "epoch": 21.33, + "learning_rate": 0.0001418882978723404, + "loss": 0.339, + "step": 24380 + }, + { + "epoch": 21.34, + "learning_rate": 0.00014182180851063828, + "loss": 0.4816, + "step": 24390 + }, + { + "epoch": 21.35, + "learning_rate": 0.00014175531914893615, + "loss": 0.2878, + "step": 24400 + }, + { + "epoch": 21.36, + "learning_rate": 0.00014168882978723404, + "loss": 0.4621, + "step": 24410 + }, + { + "epoch": 21.36, + "learning_rate": 0.00014162234042553191, + "loss": 0.4515, + "step": 24420 + }, + { + "epoch": 21.37, + "learning_rate": 0.00014155585106382978, + "loss": 0.3435, + "step": 24430 + }, + { + "epoch": 21.38, + "learning_rate": 0.00014148936170212765, + "loss": 0.4548, + "step": 24440 + }, + { + "epoch": 21.39, + "learning_rate": 0.00014142287234042552, + "loss": 0.3265, + "step": 24450 + }, + { + "epoch": 21.4, + "learning_rate": 0.0001413563829787234, + "loss": 0.5297, + "step": 24460 + }, + { + "epoch": 21.41, + "learning_rate": 0.00014128989361702126, + "loss": 0.4099, + "step": 24470 + }, + { + "epoch": 21.42, + "learning_rate": 0.00014122340425531913, + "loss": 0.4471, + "step": 24480 + }, + { + "epoch": 21.43, + "learning_rate": 0.000141156914893617, + "loss": 0.4924, + "step": 24490 + }, + { + "epoch": 21.43, + "learning_rate": 0.00014109042553191487, + "loss": 0.2733, + "step": 24500 + }, + { + "epoch": 21.44, + "learning_rate": 0.00014102393617021274, + "loss": 0.4417, + "step": 24510 + }, + { + "epoch": 21.45, + "learning_rate": 0.0001409574468085106, + "loss": 0.3721, + "step": 24520 + }, + { + "epoch": 21.46, + "learning_rate": 0.00014089095744680848, + "loss": 0.3949, + "step": 24530 + }, + { + "epoch": 21.47, + "learning_rate": 0.00014082446808510638, + "loss": 0.3895, + "step": 24540 + }, + { + "epoch": 21.48, + "learning_rate": 0.00014075797872340425, + "loss": 0.2757, + "step": 24550 + }, + { + "epoch": 21.49, + "learning_rate": 0.00014069148936170212, + "loss": 0.4789, + "step": 24560 + }, + { + "epoch": 21.5, + "learning_rate": 0.000140625, + "loss": 0.3346, + "step": 24570 + }, + { + "epoch": 21.5, + "learning_rate": 0.00014055851063829786, + "loss": 0.2773, + "step": 24580 + }, + { + "epoch": 21.51, + "learning_rate": 0.00014049202127659573, + "loss": 0.4266, + "step": 24590 + }, + { + "epoch": 21.52, + "learning_rate": 0.0001404255319148936, + "loss": 0.3301, + "step": 24600 + }, + { + "epoch": 21.52, + "eval_cer1": 0.2788899767057155, + "eval_cer2": 0.2549302707136998, + "eval_cer3": 0.22577589023195035, + "eval_cer4": 0.23229981647831546, + "eval_cer5": 0.24883227176220807, + "eval_loss": 1.0316708087921143, + "eval_runtime": 1349.3417, + "eval_samples_per_second": 6.492, + "step": 24600 + }, + { + "epoch": 21.53, + "learning_rate": 0.00014035904255319147, + "loss": 0.4875, + "step": 24610 + }, + { + "epoch": 21.54, + "learning_rate": 0.00014029255319148937, + "loss": 0.3975, + "step": 24620 + }, + { + "epoch": 21.55, + "learning_rate": 0.00014022606382978724, + "loss": 0.3878, + "step": 24630 + }, + { + "epoch": 21.56, + "learning_rate": 0.0001401595744680851, + "loss": 0.4372, + "step": 24640 + }, + { + "epoch": 21.57, + "learning_rate": 0.00014009308510638298, + "loss": 0.325, + "step": 24650 + }, + { + "epoch": 21.57, + "learning_rate": 0.00014002659574468082, + "loss": 0.4956, + "step": 24660 + }, + { + "epoch": 21.58, + "learning_rate": 0.00013996010638297872, + "loss": 0.4298, + "step": 24670 + }, + { + "epoch": 21.59, + "learning_rate": 0.00013989361702127658, + "loss": 0.3395, + "step": 24680 + }, + { + "epoch": 21.6, + "learning_rate": 0.00013982712765957445, + "loss": 0.4925, + "step": 24690 + }, + { + "epoch": 21.61, + "learning_rate": 0.00013976063829787232, + "loss": 0.3045, + "step": 24700 + }, + { + "epoch": 21.62, + "learning_rate": 0.0001396941489361702, + "loss": 0.4871, + "step": 24710 + }, + { + "epoch": 21.63, + "learning_rate": 0.00013962765957446806, + "loss": 0.3903, + "step": 24720 + }, + { + "epoch": 21.64, + "learning_rate": 0.00013956117021276593, + "loss": 0.3896, + "step": 24730 + }, + { + "epoch": 21.64, + "learning_rate": 0.0001394946808510638, + "loss": 0.4938, + "step": 24740 + }, + { + "epoch": 21.65, + "learning_rate": 0.0001394281914893617, + "loss": 0.3297, + "step": 24750 + }, + { + "epoch": 21.66, + "learning_rate": 0.00013936170212765957, + "loss": 0.4553, + "step": 24760 + }, + { + "epoch": 21.67, + "learning_rate": 0.00013929521276595744, + "loss": 0.4428, + "step": 24770 + }, + { + "epoch": 21.68, + "learning_rate": 0.0001392287234042553, + "loss": 0.3274, + "step": 24780 + }, + { + "epoch": 21.69, + "learning_rate": 0.00013916223404255318, + "loss": 0.449, + "step": 24790 + }, + { + "epoch": 21.7, + "learning_rate": 0.00013909574468085105, + "loss": 0.3249, + "step": 24800 + }, + { + "epoch": 21.71, + "learning_rate": 0.00013902925531914892, + "loss": 0.4933, + "step": 24810 + }, + { + "epoch": 21.71, + "learning_rate": 0.0001389627659574468, + "loss": 0.4475, + "step": 24820 + }, + { + "epoch": 21.72, + "learning_rate": 0.0001388962765957447, + "loss": 0.3727, + "step": 24830 + }, + { + "epoch": 21.73, + "learning_rate": 0.00013882978723404253, + "loss": 0.4106, + "step": 24840 + }, + { + "epoch": 21.74, + "learning_rate": 0.0001387632978723404, + "loss": 0.3125, + "step": 24850 + }, + { + "epoch": 21.75, + "learning_rate": 0.00013869680851063827, + "loss": 0.3739, + "step": 24860 + }, + { + "epoch": 21.76, + "learning_rate": 0.00013863031914893617, + "loss": 0.3818, + "step": 24870 + }, + { + "epoch": 21.77, + "learning_rate": 0.00013856382978723404, + "loss": 0.3246, + "step": 24880 + }, + { + "epoch": 21.78, + "learning_rate": 0.0001384973404255319, + "loss": 0.4254, + "step": 24890 + }, + { + "epoch": 21.78, + "learning_rate": 0.00013843085106382978, + "loss": 0.4326, + "step": 24900 + }, + { + "epoch": 21.79, + "learning_rate": 0.00013836436170212765, + "loss": 0.4772, + "step": 24910 + }, + { + "epoch": 21.8, + "learning_rate": 0.00013829787234042552, + "loss": 0.3864, + "step": 24920 + }, + { + "epoch": 21.81, + "learning_rate": 0.00013823138297872339, + "loss": 0.3705, + "step": 24930 + }, + { + "epoch": 21.82, + "learning_rate": 0.00013816489361702126, + "loss": 0.5329, + "step": 24940 + }, + { + "epoch": 21.83, + "learning_rate": 0.00013809840425531915, + "loss": 0.3486, + "step": 24950 + }, + { + "epoch": 21.84, + "learning_rate": 0.00013803191489361702, + "loss": 0.4645, + "step": 24960 + }, + { + "epoch": 21.85, + "learning_rate": 0.0001379654255319149, + "loss": 0.3957, + "step": 24970 + }, + { + "epoch": 21.85, + "learning_rate": 0.00013789893617021276, + "loss": 0.4219, + "step": 24980 + }, + { + "epoch": 21.86, + "learning_rate": 0.00013783244680851063, + "loss": 0.4307, + "step": 24990 + }, + { + "epoch": 21.87, + "learning_rate": 0.0001377659574468085, + "loss": 0.3554, + "step": 25000 + }, + { + "epoch": 21.88, + "learning_rate": 0.00013769946808510637, + "loss": 0.4521, + "step": 25010 + }, + { + "epoch": 21.89, + "learning_rate": 0.00013763297872340424, + "loss": 0.4024, + "step": 25020 + }, + { + "epoch": 21.9, + "learning_rate": 0.0001375664893617021, + "loss": 0.4088, + "step": 25030 + }, + { + "epoch": 21.91, + "learning_rate": 0.00013749999999999998, + "loss": 0.5174, + "step": 25040 + }, + { + "epoch": 21.92, + "learning_rate": 0.00013743351063829785, + "loss": 0.341, + "step": 25050 + }, + { + "epoch": 21.92, + "learning_rate": 0.00013736702127659572, + "loss": 0.4856, + "step": 25060 + }, + { + "epoch": 21.93, + "learning_rate": 0.0001373005319148936, + "loss": 0.4195, + "step": 25070 + }, + { + "epoch": 21.94, + "learning_rate": 0.0001372340425531915, + "loss": 0.4866, + "step": 25080 + }, + { + "epoch": 21.95, + "learning_rate": 0.00013716755319148936, + "loss": 0.4518, + "step": 25090 + }, + { + "epoch": 21.96, + "learning_rate": 0.00013710106382978723, + "loss": 0.3093, + "step": 25100 + }, + { + "epoch": 21.97, + "learning_rate": 0.0001370345744680851, + "loss": 0.4767, + "step": 25110 + }, + { + "epoch": 21.98, + "learning_rate": 0.00013696808510638297, + "loss": 0.4058, + "step": 25120 + }, + { + "epoch": 21.99, + "learning_rate": 0.00013690159574468084, + "loss": 0.4197, + "step": 25130 + }, + { + "epoch": 21.99, + "learning_rate": 0.0001368351063829787, + "loss": 0.4374, + "step": 25140 + }, + { + "epoch": 22.0, + "learning_rate": 0.00013676861702127658, + "loss": 0.4609, + "step": 25150 + }, + { + "epoch": 22.01, + "learning_rate": 0.00013670212765957447, + "loss": 0.3799, + "step": 25160 + }, + { + "epoch": 22.02, + "learning_rate": 0.00013663563829787234, + "loss": 0.2781, + "step": 25170 + }, + { + "epoch": 22.03, + "learning_rate": 0.0001365691489361702, + "loss": 0.4925, + "step": 25180 + }, + { + "epoch": 22.04, + "learning_rate": 0.00013650265957446806, + "loss": 0.3444, + "step": 25190 + }, + { + "epoch": 22.05, + "learning_rate": 0.00013643617021276593, + "loss": 0.352, + "step": 25200 + }, + { + "epoch": 22.05, + "eval_cer1": 0.28101684615644307, + "eval_cer2": 0.257292863002461, + "eval_cer3": 0.23302842208428617, + "eval_cer4": 0.2341350333236743, + "eval_cer5": 0.25443736730360933, + "eval_loss": 1.0480974912643433, + "eval_runtime": 1368.8981, + "eval_samples_per_second": 6.399, + "step": 25200 + }, + { + "epoch": 22.06, + "learning_rate": 0.00013636968085106382, + "loss": 0.4391, + "step": 25210 + }, + { + "epoch": 22.06, + "learning_rate": 0.0001363031914893617, + "loss": 0.2822, + "step": 25220 + }, + { + "epoch": 22.07, + "learning_rate": 0.00013623670212765956, + "loss": 0.5069, + "step": 25230 + }, + { + "epoch": 22.08, + "learning_rate": 0.00013617021276595743, + "loss": 0.3563, + "step": 25240 + }, + { + "epoch": 22.09, + "learning_rate": 0.0001361037234042553, + "loss": 0.3632, + "step": 25250 + }, + { + "epoch": 22.1, + "learning_rate": 0.00013603723404255317, + "loss": 0.4024, + "step": 25260 + }, + { + "epoch": 22.11, + "learning_rate": 0.00013597074468085104, + "loss": 0.2997, + "step": 25270 + }, + { + "epoch": 22.12, + "learning_rate": 0.0001359042553191489, + "loss": 0.4593, + "step": 25280 + }, + { + "epoch": 22.13, + "learning_rate": 0.0001358377659574468, + "loss": 0.3679, + "step": 25290 + }, + { + "epoch": 22.13, + "learning_rate": 0.00013577127659574468, + "loss": 0.3822, + "step": 25300 + }, + { + "epoch": 22.14, + "learning_rate": 0.00013570478723404255, + "loss": 0.4141, + "step": 25310 + }, + { + "epoch": 22.15, + "learning_rate": 0.00013563829787234042, + "loss": 0.3059, + "step": 25320 + }, + { + "epoch": 22.16, + "learning_rate": 0.0001355718085106383, + "loss": 0.5324, + "step": 25330 + }, + { + "epoch": 22.17, + "learning_rate": 0.00013550531914893616, + "loss": 0.3478, + "step": 25340 + }, + { + "epoch": 22.18, + "learning_rate": 0.00013543882978723403, + "loss": 0.4233, + "step": 25350 + }, + { + "epoch": 22.19, + "learning_rate": 0.0001353723404255319, + "loss": 0.4273, + "step": 25360 + }, + { + "epoch": 22.2, + "learning_rate": 0.00013530585106382977, + "loss": 0.307, + "step": 25370 + }, + { + "epoch": 22.2, + "learning_rate": 0.00013523936170212764, + "loss": 0.4839, + "step": 25380 + }, + { + "epoch": 22.21, + "learning_rate": 0.0001351728723404255, + "loss": 0.3576, + "step": 25390 + }, + { + "epoch": 22.22, + "learning_rate": 0.00013510638297872338, + "loss": 0.4421, + "step": 25400 + }, + { + "epoch": 22.23, + "learning_rate": 0.00013503989361702127, + "loss": 0.4246, + "step": 25410 + }, + { + "epoch": 22.24, + "learning_rate": 0.00013497340425531914, + "loss": 0.3285, + "step": 25420 + }, + { + "epoch": 22.25, + "learning_rate": 0.00013490691489361701, + "loss": 0.5017, + "step": 25430 + }, + { + "epoch": 22.26, + "learning_rate": 0.00013484042553191488, + "loss": 0.2993, + "step": 25440 + }, + { + "epoch": 22.27, + "learning_rate": 0.00013477393617021275, + "loss": 0.3846, + "step": 25450 + }, + { + "epoch": 22.27, + "learning_rate": 0.00013470744680851062, + "loss": 0.4039, + "step": 25460 + }, + { + "epoch": 22.28, + "learning_rate": 0.0001346409574468085, + "loss": 0.317, + "step": 25470 + }, + { + "epoch": 22.29, + "learning_rate": 0.00013457446808510636, + "loss": 0.4561, + "step": 25480 + }, + { + "epoch": 22.3, + "learning_rate": 0.00013450797872340426, + "loss": 0.3295, + "step": 25490 + }, + { + "epoch": 22.31, + "learning_rate": 0.00013444148936170213, + "loss": 0.3637, + "step": 25500 + }, + { + "epoch": 22.32, + "learning_rate": 0.000134375, + "loss": 0.4201, + "step": 25510 + }, + { + "epoch": 22.33, + "learning_rate": 0.00013430851063829787, + "loss": 0.2746, + "step": 25520 + }, + { + "epoch": 22.34, + "learning_rate": 0.00013424202127659574, + "loss": 0.4375, + "step": 25530 + }, + { + "epoch": 22.34, + "learning_rate": 0.0001341755319148936, + "loss": 0.3407, + "step": 25540 + }, + { + "epoch": 22.35, + "learning_rate": 0.00013410904255319148, + "loss": 0.3252, + "step": 25550 + }, + { + "epoch": 22.36, + "learning_rate": 0.00013404255319148935, + "loss": 0.4388, + "step": 25560 + }, + { + "epoch": 22.37, + "learning_rate": 0.00013397606382978722, + "loss": 0.2982, + "step": 25570 + }, + { + "epoch": 22.38, + "learning_rate": 0.0001339095744680851, + "loss": 0.4699, + "step": 25580 + }, + { + "epoch": 22.39, + "learning_rate": 0.00013384308510638296, + "loss": 0.3127, + "step": 25590 + }, + { + "epoch": 22.4, + "learning_rate": 0.00013377659574468083, + "loss": 0.3841, + "step": 25600 + }, + { + "epoch": 22.41, + "learning_rate": 0.0001337101063829787, + "loss": 0.4032, + "step": 25610 + }, + { + "epoch": 22.41, + "learning_rate": 0.0001336436170212766, + "loss": 0.2641, + "step": 25620 + }, + { + "epoch": 22.42, + "learning_rate": 0.00013357712765957447, + "loss": 0.4513, + "step": 25630 + }, + { + "epoch": 22.43, + "learning_rate": 0.00013351063829787234, + "loss": 0.3007, + "step": 25640 + }, + { + "epoch": 22.44, + "learning_rate": 0.0001334441489361702, + "loss": 0.3445, + "step": 25650 + }, + { + "epoch": 22.45, + "learning_rate": 0.00013337765957446808, + "loss": 0.3983, + "step": 25660 + }, + { + "epoch": 22.46, + "learning_rate": 0.00013331117021276594, + "loss": 0.2326, + "step": 25670 + }, + { + "epoch": 22.47, + "learning_rate": 0.00013324468085106381, + "loss": 0.4835, + "step": 25680 + }, + { + "epoch": 22.48, + "learning_rate": 0.00013317819148936168, + "loss": 0.3081, + "step": 25690 + }, + { + "epoch": 22.48, + "learning_rate": 0.00013311170212765958, + "loss": 0.4082, + "step": 25700 + }, + { + "epoch": 22.49, + "learning_rate": 0.00013304521276595745, + "loss": 0.407, + "step": 25710 + }, + { + "epoch": 22.5, + "learning_rate": 0.0001329787234042553, + "loss": 0.288, + "step": 25720 + }, + { + "epoch": 22.51, + "learning_rate": 0.00013291223404255316, + "loss": 0.4324, + "step": 25730 + }, + { + "epoch": 22.52, + "learning_rate": 0.00013284574468085103, + "loss": 0.4151, + "step": 25740 + }, + { + "epoch": 22.53, + "learning_rate": 0.00013277925531914893, + "loss": 0.3621, + "step": 25750 + }, + { + "epoch": 22.54, + "learning_rate": 0.0001327127659574468, + "loss": 0.4488, + "step": 25760 + }, + { + "epoch": 22.55, + "learning_rate": 0.00013264627659574467, + "loss": 0.2726, + "step": 25770 + }, + { + "epoch": 22.55, + "learning_rate": 0.00013257978723404254, + "loss": 0.4988, + "step": 25780 + }, + { + "epoch": 22.56, + "learning_rate": 0.0001325132978723404, + "loss": 0.3855, + "step": 25790 + }, + { + "epoch": 22.57, + "learning_rate": 0.00013244680851063828, + "loss": 0.3484, + "step": 25800 + }, + { + "epoch": 22.57, + "eval_cer1": 0.27561527294824617, + "eval_cer2": 0.25178014766201806, + "eval_cer3": 0.22727866710225417, + "eval_cer4": 0.2294664992433755, + "eval_cer5": 0.249171974522293, + "eval_loss": 1.0398242473602295, + "eval_runtime": 1371.0312, + "eval_samples_per_second": 6.389, + "step": 25800 + }, + { + "epoch": 22.58, + "learning_rate": 0.00013238031914893615, + "loss": 0.3648, + "step": 25810 + }, + { + "epoch": 22.59, + "learning_rate": 0.00013231382978723402, + "loss": 0.3256, + "step": 25820 + }, + { + "epoch": 22.6, + "learning_rate": 0.00013224734042553192, + "loss": 0.4772, + "step": 25830 + }, + { + "epoch": 22.61, + "learning_rate": 0.0001321808510638298, + "loss": 0.3659, + "step": 25840 + }, + { + "epoch": 22.62, + "learning_rate": 0.00013211436170212766, + "loss": 0.4016, + "step": 25850 + }, + { + "epoch": 22.62, + "learning_rate": 0.00013204787234042553, + "loss": 0.372, + "step": 25860 + }, + { + "epoch": 22.63, + "learning_rate": 0.0001319813829787234, + "loss": 0.4156, + "step": 25870 + }, + { + "epoch": 22.64, + "learning_rate": 0.00013191489361702127, + "loss": 0.4196, + "step": 25880 + }, + { + "epoch": 22.65, + "learning_rate": 0.00013184840425531914, + "loss": 0.3156, + "step": 25890 + }, + { + "epoch": 22.66, + "learning_rate": 0.000131781914893617, + "loss": 0.3585, + "step": 25900 + }, + { + "epoch": 22.67, + "learning_rate": 0.00013171542553191488, + "loss": 0.3941, + "step": 25910 + }, + { + "epoch": 22.68, + "learning_rate": 0.00013164893617021275, + "loss": 0.2504, + "step": 25920 + }, + { + "epoch": 22.69, + "learning_rate": 0.00013158244680851062, + "loss": 0.4609, + "step": 25930 + }, + { + "epoch": 22.69, + "learning_rate": 0.00013151595744680849, + "loss": 0.3998, + "step": 25940 + }, + { + "epoch": 22.7, + "learning_rate": 0.00013144946808510636, + "loss": 0.3959, + "step": 25950 + }, + { + "epoch": 22.71, + "learning_rate": 0.00013138297872340425, + "loss": 0.407, + "step": 25960 + }, + { + "epoch": 22.72, + "learning_rate": 0.00013131648936170212, + "loss": 0.3075, + "step": 25970 + }, + { + "epoch": 22.73, + "learning_rate": 0.00013125, + "loss": 0.5365, + "step": 25980 + }, + { + "epoch": 22.74, + "learning_rate": 0.00013118351063829786, + "loss": 0.3169, + "step": 25990 + }, + { + "epoch": 22.75, + "learning_rate": 0.00013111702127659573, + "loss": 0.379, + "step": 26000 + }, + { + "epoch": 22.76, + "learning_rate": 0.0001310505319148936, + "loss": 0.4853, + "step": 26010 + }, + { + "epoch": 22.76, + "learning_rate": 0.00013098404255319147, + "loss": 0.2365, + "step": 26020 + }, + { + "epoch": 22.77, + "learning_rate": 0.00013091755319148937, + "loss": 0.567, + "step": 26030 + }, + { + "epoch": 22.78, + "learning_rate": 0.00013085106382978724, + "loss": 0.3252, + "step": 26040 + }, + { + "epoch": 22.79, + "learning_rate": 0.0001307845744680851, + "loss": 0.4379, + "step": 26050 + }, + { + "epoch": 22.8, + "learning_rate": 0.00013071808510638298, + "loss": 0.4442, + "step": 26060 + }, + { + "epoch": 22.81, + "learning_rate": 0.00013065159574468082, + "loss": 0.3301, + "step": 26070 + }, + { + "epoch": 22.82, + "learning_rate": 0.00013058510638297872, + "loss": 0.5047, + "step": 26080 + }, + { + "epoch": 22.83, + "learning_rate": 0.0001305186170212766, + "loss": 0.3607, + "step": 26090 + }, + { + "epoch": 22.83, + "learning_rate": 0.00013045212765957446, + "loss": 0.3428, + "step": 26100 + }, + { + "epoch": 22.84, + "learning_rate": 0.00013038563829787233, + "loss": 0.4347, + "step": 26110 + }, + { + "epoch": 22.85, + "learning_rate": 0.0001303191489361702, + "loss": 0.2966, + "step": 26120 + }, + { + "epoch": 22.86, + "learning_rate": 0.00013025265957446807, + "loss": 0.5188, + "step": 26130 + }, + { + "epoch": 22.87, + "learning_rate": 0.00013018617021276594, + "loss": 0.2911, + "step": 26140 + }, + { + "epoch": 22.88, + "learning_rate": 0.0001301196808510638, + "loss": 0.3895, + "step": 26150 + }, + { + "epoch": 22.89, + "learning_rate": 0.0001300531914893617, + "loss": 0.4055, + "step": 26160 + }, + { + "epoch": 22.9, + "learning_rate": 0.00012998670212765957, + "loss": 0.3444, + "step": 26170 + }, + { + "epoch": 22.9, + "learning_rate": 0.00012992021276595744, + "loss": 0.407, + "step": 26180 + }, + { + "epoch": 22.91, + "learning_rate": 0.0001298537234042553, + "loss": 0.3479, + "step": 26190 + }, + { + "epoch": 22.92, + "learning_rate": 0.00012978723404255318, + "loss": 0.3657, + "step": 26200 + }, + { + "epoch": 22.93, + "learning_rate": 0.00012972074468085105, + "loss": 0.4422, + "step": 26210 + }, + { + "epoch": 22.94, + "learning_rate": 0.00012965425531914892, + "loss": 0.3191, + "step": 26220 + }, + { + "epoch": 22.95, + "learning_rate": 0.0001295877659574468, + "loss": 0.4634, + "step": 26230 + }, + { + "epoch": 22.96, + "learning_rate": 0.0001295212765957447, + "loss": 0.3084, + "step": 26240 + }, + { + "epoch": 22.97, + "learning_rate": 0.00012945478723404253, + "loss": 0.3569, + "step": 26250 + }, + { + "epoch": 22.97, + "learning_rate": 0.0001293882978723404, + "loss": 0.4126, + "step": 26260 + }, + { + "epoch": 22.98, + "learning_rate": 0.00012932180851063827, + "loss": 0.3154, + "step": 26270 + }, + { + "epoch": 22.99, + "learning_rate": 0.00012925531914893614, + "loss": 0.4272, + "step": 26280 + }, + { + "epoch": 23.0, + "learning_rate": 0.00012918882978723404, + "loss": 0.3112, + "step": 26290 + }, + { + "epoch": 23.01, + "learning_rate": 0.0001291223404255319, + "loss": 0.4143, + "step": 26300 + }, + { + "epoch": 23.02, + "learning_rate": 0.00012905585106382978, + "loss": 0.2965, + "step": 26310 + }, + { + "epoch": 23.03, + "learning_rate": 0.00012898936170212765, + "loss": 0.3541, + "step": 26320 + }, + { + "epoch": 23.04, + "learning_rate": 0.00012892287234042552, + "loss": 0.3308, + "step": 26330 + }, + { + "epoch": 23.04, + "learning_rate": 0.0001288563829787234, + "loss": 0.2968, + "step": 26340 + }, + { + "epoch": 23.05, + "learning_rate": 0.00012878989361702126, + "loss": 0.4355, + "step": 26350 + }, + { + "epoch": 23.06, + "learning_rate": 0.00012872340425531913, + "loss": 0.2734, + "step": 26360 + }, + { + "epoch": 23.07, + "learning_rate": 0.00012865691489361702, + "loss": 0.3837, + "step": 26370 + }, + { + "epoch": 23.08, + "learning_rate": 0.0001285904255319149, + "loss": 0.3263, + "step": 26380 + }, + { + "epoch": 23.09, + "learning_rate": 0.00012852393617021276, + "loss": 0.295, + "step": 26390 + }, + { + "epoch": 23.1, + "learning_rate": 0.00012845744680851063, + "loss": 0.424, + "step": 26400 + }, + { + "epoch": 23.1, + "eval_cer1": 0.27635798926437327, + "eval_cer2": 0.2505988515176374, + "eval_cer3": 0.22584122835674617, + "eval_cer4": 0.22882256350816188, + "eval_cer5": 0.253588110403397, + "eval_loss": 1.0314199924468994, + "eval_runtime": 1400.8059, + "eval_samples_per_second": 6.254, + "step": 26400 + }, + { + "epoch": 23.11, + "learning_rate": 0.0001283909574468085, + "loss": 0.2717, + "step": 26410 + }, + { + "epoch": 23.11, + "learning_rate": 0.00012832446808510637, + "loss": 0.428, + "step": 26420 + }, + { + "epoch": 23.12, + "learning_rate": 0.00012825797872340424, + "loss": 0.3823, + "step": 26430 + }, + { + "epoch": 23.13, + "learning_rate": 0.00012819148936170211, + "loss": 0.2909, + "step": 26440 + }, + { + "epoch": 23.14, + "learning_rate": 0.00012812499999999998, + "loss": 0.4054, + "step": 26450 + }, + { + "epoch": 23.15, + "learning_rate": 0.00012805851063829785, + "loss": 0.3266, + "step": 26460 + }, + { + "epoch": 23.16, + "learning_rate": 0.00012799202127659572, + "loss": 0.3843, + "step": 26470 + }, + { + "epoch": 23.17, + "learning_rate": 0.0001279255319148936, + "loss": 0.2991, + "step": 26480 + }, + { + "epoch": 23.18, + "learning_rate": 0.00012785904255319146, + "loss": 0.3065, + "step": 26490 + }, + { + "epoch": 23.18, + "learning_rate": 0.00012779255319148936, + "loss": 0.438, + "step": 26500 + }, + { + "epoch": 23.19, + "learning_rate": 0.00012772606382978723, + "loss": 0.2879, + "step": 26510 + }, + { + "epoch": 23.2, + "learning_rate": 0.0001276595744680851, + "loss": 0.3609, + "step": 26520 + }, + { + "epoch": 23.21, + "learning_rate": 0.00012759308510638297, + "loss": 0.391, + "step": 26530 + }, + { + "epoch": 23.22, + "learning_rate": 0.00012752659574468084, + "loss": 0.3833, + "step": 26540 + }, + { + "epoch": 23.23, + "learning_rate": 0.0001274601063829787, + "loss": 0.4542, + "step": 26550 + }, + { + "epoch": 23.24, + "learning_rate": 0.00012739361702127658, + "loss": 0.2725, + "step": 26560 + }, + { + "epoch": 23.25, + "learning_rate": 0.00012732712765957448, + "loss": 0.4266, + "step": 26570 + }, + { + "epoch": 23.25, + "learning_rate": 0.00012726063829787235, + "loss": 0.3592, + "step": 26580 + }, + { + "epoch": 23.26, + "learning_rate": 0.00012719414893617022, + "loss": 0.2933, + "step": 26590 + }, + { + "epoch": 23.27, + "learning_rate": 0.00012712765957446806, + "loss": 0.4514, + "step": 26600 + }, + { + "epoch": 23.28, + "learning_rate": 0.00012706117021276593, + "loss": 0.3054, + "step": 26610 + }, + { + "epoch": 23.29, + "learning_rate": 0.00012699468085106383, + "loss": 0.359, + "step": 26620 + }, + { + "epoch": 23.3, + "learning_rate": 0.0001269281914893617, + "loss": 0.3914, + "step": 26630 + }, + { + "epoch": 23.31, + "learning_rate": 0.00012686170212765957, + "loss": 0.3302, + "step": 26640 + }, + { + "epoch": 23.32, + "learning_rate": 0.00012679521276595744, + "loss": 0.4226, + "step": 26650 + }, + { + "epoch": 23.32, + "learning_rate": 0.0001267287234042553, + "loss": 0.3161, + "step": 26660 + }, + { + "epoch": 23.33, + "learning_rate": 0.00012666223404255317, + "loss": 0.3727, + "step": 26670 + }, + { + "epoch": 23.34, + "learning_rate": 0.00012659574468085104, + "loss": 0.3386, + "step": 26680 + }, + { + "epoch": 23.35, + "learning_rate": 0.00012652925531914891, + "loss": 0.3063, + "step": 26690 + }, + { + "epoch": 23.36, + "learning_rate": 0.0001264627659574468, + "loss": 0.4585, + "step": 26700 + }, + { + "epoch": 23.37, + "learning_rate": 0.00012639627659574468, + "loss": 0.3183, + "step": 26710 + }, + { + "epoch": 23.38, + "learning_rate": 0.00012632978723404255, + "loss": 0.414, + "step": 26720 + }, + { + "epoch": 23.39, + "learning_rate": 0.00012626329787234042, + "loss": 0.364, + "step": 26730 + }, + { + "epoch": 23.39, + "learning_rate": 0.0001261968085106383, + "loss": 0.3201, + "step": 26740 + }, + { + "epoch": 23.4, + "learning_rate": 0.00012613031914893616, + "loss": 0.4593, + "step": 26750 + }, + { + "epoch": 23.41, + "learning_rate": 0.00012606382978723403, + "loss": 0.2704, + "step": 26760 + }, + { + "epoch": 23.42, + "learning_rate": 0.0001259973404255319, + "loss": 0.3844, + "step": 26770 + }, + { + "epoch": 23.43, + "learning_rate": 0.00012593085106382977, + "loss": 0.3405, + "step": 26780 + }, + { + "epoch": 23.44, + "learning_rate": 0.00012586436170212764, + "loss": 0.295, + "step": 26790 + }, + { + "epoch": 23.45, + "learning_rate": 0.0001257978723404255, + "loss": 0.435, + "step": 26800 + }, + { + "epoch": 23.46, + "learning_rate": 0.00012573138297872338, + "loss": 0.3137, + "step": 26810 + }, + { + "epoch": 23.46, + "learning_rate": 0.00012566489361702125, + "loss": 0.364, + "step": 26820 + }, + { + "epoch": 23.47, + "learning_rate": 0.00012559840425531915, + "loss": 0.3592, + "step": 26830 + }, + { + "epoch": 23.48, + "learning_rate": 0.00012553191489361702, + "loss": 0.3229, + "step": 26840 + }, + { + "epoch": 23.49, + "learning_rate": 0.0001254654255319149, + "loss": 0.4261, + "step": 26850 + }, + { + "epoch": 23.5, + "learning_rate": 0.00012539893617021276, + "loss": 0.282, + "step": 26860 + }, + { + "epoch": 23.51, + "learning_rate": 0.00012533244680851063, + "loss": 0.4243, + "step": 26870 + }, + { + "epoch": 23.52, + "learning_rate": 0.0001252659574468085, + "loss": 0.3403, + "step": 26880 + }, + { + "epoch": 23.53, + "learning_rate": 0.00012519946808510637, + "loss": 0.3031, + "step": 26890 + }, + { + "epoch": 23.53, + "learning_rate": 0.00012513297872340424, + "loss": 0.4079, + "step": 26900 + }, + { + "epoch": 23.54, + "learning_rate": 0.00012506648936170213, + "loss": 0.3495, + "step": 26910 + }, + { + "epoch": 23.55, + "learning_rate": 0.000125, + "loss": 0.3684, + "step": 26920 + }, + { + "epoch": 23.56, + "learning_rate": 0.00012493351063829787, + "loss": 0.3207, + "step": 26930 + }, + { + "epoch": 23.57, + "learning_rate": 0.00012486702127659574, + "loss": 0.2546, + "step": 26940 + }, + { + "epoch": 23.58, + "learning_rate": 0.00012480053191489359, + "loss": 0.4764, + "step": 26950 + }, + { + "epoch": 23.59, + "learning_rate": 0.00012473404255319148, + "loss": 0.2915, + "step": 26960 + }, + { + "epoch": 23.6, + "learning_rate": 0.00012466755319148935, + "loss": 0.4261, + "step": 26970 + }, + { + "epoch": 23.6, + "learning_rate": 0.00012460106382978722, + "loss": 0.3006, + "step": 26980 + }, + { + "epoch": 23.61, + "learning_rate": 0.0001245345744680851, + "loss": 0.3342, + "step": 26990 + }, + { + "epoch": 23.62, + "learning_rate": 0.00012446808510638296, + "loss": 0.4164, + "step": 27000 + }, + { + "epoch": 23.62, + "eval_cer1": 0.2698423415819858, + "eval_cer2": 0.2459721082854799, + "eval_cer3": 0.2241424371120549, + "eval_cer4": 0.2256994751923758, + "eval_cer5": 0.25171974522292995, + "eval_loss": 1.0343782901763916, + "eval_runtime": 1386.7142, + "eval_samples_per_second": 6.317, + "step": 27000 + }, + { + "epoch": 23.63, + "learning_rate": 0.00012440159574468083, + "loss": 0.2961, + "step": 27010 + }, + { + "epoch": 23.64, + "learning_rate": 0.0001243351063829787, + "loss": 0.4047, + "step": 27020 + }, + { + "epoch": 23.65, + "learning_rate": 0.00012426861702127657, + "loss": 0.2755, + "step": 27030 + }, + { + "epoch": 23.66, + "learning_rate": 0.00012420212765957447, + "loss": 0.3193, + "step": 27040 + }, + { + "epoch": 23.67, + "learning_rate": 0.00012413563829787234, + "loss": 0.4594, + "step": 27050 + }, + { + "epoch": 23.67, + "learning_rate": 0.0001240691489361702, + "loss": 0.3148, + "step": 27060 + }, + { + "epoch": 23.68, + "learning_rate": 0.00012400265957446808, + "loss": 0.3959, + "step": 27070 + }, + { + "epoch": 23.69, + "learning_rate": 0.00012393617021276595, + "loss": 0.3991, + "step": 27080 + }, + { + "epoch": 23.7, + "learning_rate": 0.00012386968085106382, + "loss": 0.3561, + "step": 27090 + }, + { + "epoch": 23.71, + "learning_rate": 0.0001238031914893617, + "loss": 0.4394, + "step": 27100 + }, + { + "epoch": 23.72, + "learning_rate": 0.00012373670212765956, + "loss": 0.316, + "step": 27110 + }, + { + "epoch": 23.73, + "learning_rate": 0.00012367021276595745, + "loss": 0.4124, + "step": 27120 + }, + { + "epoch": 23.74, + "learning_rate": 0.0001236037234042553, + "loss": 0.3595, + "step": 27130 + }, + { + "epoch": 23.74, + "learning_rate": 0.00012353723404255317, + "loss": 0.2912, + "step": 27140 + }, + { + "epoch": 23.75, + "learning_rate": 0.00012347074468085104, + "loss": 0.4619, + "step": 27150 + }, + { + "epoch": 23.76, + "learning_rate": 0.00012340425531914893, + "loss": 0.2748, + "step": 27160 + }, + { + "epoch": 23.77, + "learning_rate": 0.0001233377659574468, + "loss": 0.4158, + "step": 27170 + }, + { + "epoch": 23.78, + "learning_rate": 0.00012327127659574467, + "loss": 0.3796, + "step": 27180 + }, + { + "epoch": 23.79, + "learning_rate": 0.00012320478723404254, + "loss": 0.2541, + "step": 27190 + }, + { + "epoch": 23.8, + "learning_rate": 0.0001231382978723404, + "loss": 0.4001, + "step": 27200 + }, + { + "epoch": 23.81, + "learning_rate": 0.00012307180851063828, + "loss": 0.2972, + "step": 27210 + }, + { + "epoch": 23.81, + "learning_rate": 0.00012300531914893615, + "loss": 0.4062, + "step": 27220 + }, + { + "epoch": 23.82, + "learning_rate": 0.00012293882978723402, + "loss": 0.349, + "step": 27230 + }, + { + "epoch": 23.83, + "learning_rate": 0.00012287234042553192, + "loss": 0.266, + "step": 27240 + }, + { + "epoch": 23.84, + "learning_rate": 0.0001228058510638298, + "loss": 0.4199, + "step": 27250 + }, + { + "epoch": 23.85, + "learning_rate": 0.00012273936170212766, + "loss": 0.2909, + "step": 27260 + }, + { + "epoch": 23.86, + "learning_rate": 0.00012267287234042553, + "loss": 0.3478, + "step": 27270 + }, + { + "epoch": 23.87, + "learning_rate": 0.0001226063829787234, + "loss": 0.3861, + "step": 27280 + }, + { + "epoch": 23.88, + "learning_rate": 0.00012253989361702127, + "loss": 0.3052, + "step": 27290 + }, + { + "epoch": 23.88, + "learning_rate": 0.00012247340425531914, + "loss": 0.3957, + "step": 27300 + }, + { + "epoch": 23.89, + "learning_rate": 0.000122406914893617, + "loss": 0.2195, + "step": 27310 + }, + { + "epoch": 23.9, + "learning_rate": 0.00012234042553191488, + "loss": 0.4105, + "step": 27320 + }, + { + "epoch": 23.91, + "learning_rate": 0.00012227393617021275, + "loss": 0.3528, + "step": 27330 + }, + { + "epoch": 23.92, + "learning_rate": 0.00012220744680851062, + "loss": 0.2182, + "step": 27340 + }, + { + "epoch": 23.93, + "learning_rate": 0.0001221409574468085, + "loss": 0.3753, + "step": 27350 + }, + { + "epoch": 23.94, + "learning_rate": 0.00012207446808510636, + "loss": 0.2714, + "step": 27360 + }, + { + "epoch": 23.95, + "learning_rate": 0.00012200797872340424, + "loss": 0.4577, + "step": 27370 + }, + { + "epoch": 23.95, + "learning_rate": 0.00012194148936170211, + "loss": 0.3986, + "step": 27380 + }, + { + "epoch": 23.96, + "learning_rate": 0.000121875, + "loss": 0.2771, + "step": 27390 + }, + { + "epoch": 23.97, + "learning_rate": 0.00012180851063829786, + "loss": 0.4185, + "step": 27400 + }, + { + "epoch": 23.98, + "learning_rate": 0.00012174202127659573, + "loss": 0.3425, + "step": 27410 + }, + { + "epoch": 23.99, + "learning_rate": 0.0001216755319148936, + "loss": 0.3918, + "step": 27420 + }, + { + "epoch": 24.0, + "learning_rate": 0.00012160904255319149, + "loss": 0.3223, + "step": 27430 + }, + { + "epoch": 24.01, + "learning_rate": 0.00012154255319148936, + "loss": 0.462, + "step": 27440 + }, + { + "epoch": 24.02, + "learning_rate": 0.00012147606382978723, + "loss": 0.2669, + "step": 27450 + }, + { + "epoch": 24.02, + "learning_rate": 0.0001214095744680851, + "loss": 0.2796, + "step": 27460 + }, + { + "epoch": 24.03, + "learning_rate": 0.00012134308510638298, + "loss": 0.3234, + "step": 27470 + }, + { + "epoch": 24.04, + "learning_rate": 0.00012127659574468084, + "loss": 0.2189, + "step": 27480 + }, + { + "epoch": 24.05, + "learning_rate": 0.0001212101063829787, + "loss": 0.3613, + "step": 27490 + }, + { + "epoch": 24.06, + "learning_rate": 0.00012114361702127658, + "loss": 0.2877, + "step": 27500 + }, + { + "epoch": 24.07, + "learning_rate": 0.00012107712765957445, + "loss": 0.2961, + "step": 27510 + }, + { + "epoch": 24.08, + "learning_rate": 0.00012101063829787233, + "loss": 0.3661, + "step": 27520 + }, + { + "epoch": 24.09, + "learning_rate": 0.0001209441489361702, + "loss": 0.2302, + "step": 27530 + }, + { + "epoch": 24.09, + "learning_rate": 0.00012087765957446807, + "loss": 0.3697, + "step": 27540 + }, + { + "epoch": 24.1, + "learning_rate": 0.00012081117021276594, + "loss": 0.305, + "step": 27550 + }, + { + "epoch": 24.11, + "learning_rate": 0.00012074468085106382, + "loss": 0.2548, + "step": 27560 + }, + { + "epoch": 24.12, + "learning_rate": 0.00012067819148936169, + "loss": 0.2987, + "step": 27570 + }, + { + "epoch": 24.13, + "learning_rate": 0.00012061170212765956, + "loss": 0.2833, + "step": 27580 + }, + { + "epoch": 24.14, + "learning_rate": 0.00012054521276595743, + "loss": 0.3481, + "step": 27590 + }, + { + "epoch": 24.15, + "learning_rate": 0.00012047872340425532, + "loss": 0.2869, + "step": 27600 + }, + { + "epoch": 24.15, + "eval_cer1": 0.26882954660544883, + "eval_cer2": 0.24485643970467597, + "eval_cer3": 0.2234563868016988, + "eval_cer4": 0.22144949933996588, + "eval_cer5": 0.24883227176220807, + "eval_loss": 1.0210694074630737, + "eval_runtime": 1390.8693, + "eval_samples_per_second": 6.298, + "step": 27600 } ], "max_steps": 45720, "num_train_epochs": 40, - "total_flos": 9.31203772819588e+19, + "total_flos": 1.601241517283e+20, "trial_name": null, "trial_params": null }