diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,28616 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 101.8409714061888, + "global_step": 260000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.2, + "learning_rate": 6.25e-06, + "loss": 5.8333, + "step": 500 + }, + { + "epoch": 0.2, + "eval_bleu_bleu": 0.0011348604048199084, + "eval_bleu_brevity_penalty": 0.4414813871102664, + "eval_bleu_length_ratio": 0.5501701786561132, + "eval_bleu_precisions": [ + 0.14443071383892475, + 0.005122277968951115, + 0.0007111797456008453, + 8.298853572656463e-05 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 131094, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 1.8938612539672754, + "eval_chrf_word_order": 2, + "eval_loss": 5.333437919616699, + "eval_meteor": 0.027928954060867005, + "eval_runtime": 941.5516, + "eval_samples_per_second": 18.266, + "eval_scarebleu_bp": 0.9852687390578014, + "eval_scarebleu_counts": [ + 37718, + 1353, + 89, + 8 + ], + "eval_scarebleu_precisions": [ + 15.269147157529117, + 0.5879183432261205, + 0.04167622722441009, + 0.004050776483217127 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 0.19439913164712938, + "eval_scarebleu_sys_len": 247021, + "eval_scarebleu_totals": [ + 247021, + 230134, + 213551, + 197493 + ], + "eval_steps_per_second": 0.571, + "eval_ter_num_edits": 216339, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 99.0703808690794, + "step": 500 + }, + { + "epoch": 0.39, + "learning_rate": 1.25e-05, + "loss": 5.3215, + "step": 1000 + }, + { + "epoch": 0.39, + "eval_bleu_bleu": 0.004067854053505411, + "eval_bleu_brevity_penalty": 0.4362692697553245, + "eval_bleu_length_ratio": 0.5465987350962527, + "eval_bleu_precisions": [ + 0.1365831561005198, + 0.013658743183863625, + 0.006191791512214156, + 0.0006543630260654606 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 130243, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 3.635601016744266, + "eval_chrf_word_order": 2, + "eval_loss": 5.1802873611450195, + "eval_meteor": 0.04689638563159233, + "eval_runtime": 941.3581, + "eval_samples_per_second": 18.269, + "eval_scarebleu_bp": 0.9776506737349471, + "eval_scarebleu_counts": [ + 35175, + 2218, + 613, + 55 + ], + "eval_scarebleu_precisions": [ + 14.348592267465103, + 0.9717968602811989, + 0.2894677193910317, + 0.02809476620046382 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 0.567330707496034, + "eval_scarebleu_sys_len": 245146, + "eval_scarebleu_totals": [ + 245146, + 228237, + 211768, + 195766 + ], + "eval_steps_per_second": 0.572, + "eval_ter_num_edits": 217130, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 99.43261177181742, + "step": 1000 + }, + { + "epoch": 0.59, + "learning_rate": 1.8750000000000002e-05, + "loss": 5.1406, + "step": 1500 + }, + { + "epoch": 0.59, + "eval_bleu_bleu": 0.005622999683564658, + "eval_bleu_brevity_penalty": 0.5770406320341732, + "eval_bleu_length_ratio": 0.6452268139449973, + "eval_bleu_precisions": [ + 0.1307758351545426, + 0.013514008155257358, + 0.006083618459484269, + 0.000838635049161365 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 153744, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 4.325666048045834, + "eval_chrf_word_order": 2, + "eval_loss": 5.029767036437988, + "eval_meteor": 0.05282028973915344, + "eval_runtime": 931.3088, + "eval_samples_per_second": 18.466, + "eval_scarebleu_bp": 0.999345583710839, + "eval_scarebleu_counts": [ + 33183, + 2613, + 748, + 92 + ], + "eval_scarebleu_precisions": [ + 13.245490434012046, + 1.1196428112332781, + 0.3457376738510462, + 0.04609079887378135 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 0.6967754135830652, + "eval_scarebleu_sys_len": 250523, + "eval_scarebleu_totals": [ + 250523, + 233378, + 216349, + 199606 + ], + "eval_steps_per_second": 0.578, + "eval_ter_num_edits": 216728, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 99.24851970746764, + "step": 1500 + }, + { + "epoch": 0.78, + "learning_rate": 2.5e-05, + "loss": 4.9824, + "step": 2000 + }, + { + "epoch": 0.78, + "eval_bleu_bleu": 0.007154325346405612, + "eval_bleu_brevity_penalty": 0.7375275459204113, + "eval_bleu_length_ratio": 0.7666055338489753, + "eval_bleu_precisions": [ + 0.13913371946612943, + 0.01332414843282635, + 0.005381848553838693, + 0.000887479709331432 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 182666, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 5.680818746248048, + "eval_chrf_word_order": 2, + "eval_loss": 4.882014274597168, + "eval_meteor": 0.06334297999687093, + "eval_runtime": 932.9841, + "eval_samples_per_second": 18.433, + "eval_scarebleu_bp": 1.0, + "eval_scarebleu_counts": [ + 38444, + 3216, + 827, + 121 + ], + "eval_scarebleu_precisions": [ + 14.629004577747505, + 1.3093609536837991, + 0.361931937539388, + 0.05719498763926507 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 0.79353257577865, + "eval_scarebleu_sys_len": 262793, + "eval_scarebleu_totals": [ + 262793, + 245616, + 228496, + 211557 + ], + "eval_steps_per_second": 0.577, + "eval_ter_num_edits": 216276, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 99.04153062018877, + "step": 2000 + }, + { + "epoch": 0.98, + "learning_rate": 3.125e-05, + "loss": 4.8361, + "step": 2500 + }, + { + "epoch": 0.98, + "eval_bleu_bleu": 0.008206004762224288, + "eval_bleu_brevity_penalty": 0.7385647205228717, + "eval_bleu_length_ratio": 0.767432295754137, + "eval_bleu_precisions": [ + 0.14559533639938096, + 0.014829881880021005, + 0.0060025706075920405, + 0.0011758458504020635 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 182863, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 6.2952483534156345, + "eval_chrf_word_order": 2, + "eval_loss": 4.732661247253418, + "eval_meteor": 0.06864002773775764, + "eval_runtime": 922.3604, + "eval_samples_per_second": 18.646, + "eval_scarebleu_bp": 1.0, + "eval_scarebleu_counts": [ + 39953, + 3549, + 923, + 164 + ], + "eval_scarebleu_precisions": [ + 15.04118603740626, + 1.4285139269038802, + 0.3990505795528731, + 0.07654537647256501 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 0.9000743131546074, + "eval_scarebleu_sys_len": 265624, + "eval_scarebleu_totals": [ + 265624, + 248440, + 231299, + 214252 + ], + "eval_steps_per_second": 0.583, + "eval_ter_num_edits": 214601, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 98.27448035206461, + "step": 2500 + }, + { + "epoch": 1.18, + "learning_rate": 3.7500000000000003e-05, + "loss": 4.6971, + "step": 3000 + }, + { + "epoch": 1.18, + "eval_bleu_bleu": 0.008648880647271552, + "eval_bleu_brevity_penalty": 0.7250048488437403, + "eval_bleu_length_ratio": 0.7566718007042165, + "eval_bleu_precisions": [ + 0.15530868168985962, + 0.015964392782917364, + 0.006245890861275477, + 0.0013077762387117243 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 180299, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 6.484032334647311, + "eval_chrf_word_order": 2, + "eval_loss": 4.573549270629883, + "eval_meteor": 0.07222434356712659, + "eval_runtime": 928.9927, + "eval_samples_per_second": 18.513, + "eval_scarebleu_bp": 0.9786534130365887, + "eval_scarebleu_counts": [ + 40450, + 3708, + 959, + 178 + ], + "eval_scarebleu_precisions": [ + 16.48382995370672, + 1.6248477253008247, + 0.45433226422334766, + 0.09170530654301906 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.0058625170121347, + "eval_scarebleu_sys_len": 245392, + "eval_scarebleu_totals": [ + 245392, + 228206, + 211079, + 194100 + ], + "eval_steps_per_second": 0.579, + "eval_ter_num_edits": 210733, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 96.50316665827108, + "step": 3000 + }, + { + "epoch": 1.37, + "learning_rate": 4.375e-05, + "loss": 4.549, + "step": 3500 + }, + { + "epoch": 1.37, + "eval_bleu_bleu": 0.009818227703292402, + "eval_bleu_brevity_penalty": 0.8054146329598101, + "eval_bleu_length_ratio": 0.8220993037573601, + "eval_bleu_precisions": [ + 0.16576734783474315, + 0.017079572227227703, + 0.006065782795459328, + 0.0012858535371342058 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 195889, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 7.914892476951904, + "eval_chrf_word_order": 2, + "eval_loss": 4.403231620788574, + "eval_meteor": 0.08007869997330906, + "eval_runtime": 917.375, + "eval_samples_per_second": 18.747, + "eval_scarebleu_bp": 1.0, + "eval_scarebleu_counts": [ + 45437, + 4346, + 1064, + 205 + ], + "eval_scarebleu_precisions": [ + 17.567933311681283, + 1.8000331345261762, + 0.4744027608100516, + 0.09892915224955241 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.103743520939276, + "eval_scarebleu_sys_len": 258636, + "eval_scarebleu_totals": [ + 258636, + 241440, + 224282, + 207219 + ], + "eval_steps_per_second": 0.586, + "eval_ter_num_edits": 208878, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 95.65368710760227, + "step": 3500 + }, + { + "epoch": 1.57, + "learning_rate": 5e-05, + "loss": 4.3821, + "step": 4000 + }, + { + "epoch": 1.57, + "eval_bleu_bleu": 0.01033170687846357, + "eval_bleu_brevity_penalty": 0.7248241535921023, + "eval_bleu_length_ratio": 0.7565291108322597, + "eval_bleu_precisions": [ + 0.18522730424652595, + 0.02151183825648636, + 0.006967185038021511, + 0.0014870233973837681 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 180265, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 8.03687886465491, + "eval_chrf_word_order": 2, + "eval_loss": 4.259134769439697, + "eval_meteor": 0.08335491930719796, + "eval_runtime": 906.3223, + "eval_samples_per_second": 18.976, + "eval_scarebleu_bp": 1.0, + "eval_scarebleu_counts": [ + 47114, + 5075, + 1138, + 223 + ], + "eval_scarebleu_precisions": [ + 18.784887244426017, + 2.172368330936237, + 0.5256739528094455, + 0.11180130451566973 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.2444468312384684, + "eval_scarebleu_sys_len": 250808, + "eval_scarebleu_totals": [ + 250808, + 233616, + 216484, + 199461 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 205711, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 94.20338967527442, + "step": 4000 + }, + { + "epoch": 1.76, + "learning_rate": 4.99506514015002e-05, + "loss": 4.2615, + "step": 4500 + }, + { + "epoch": 1.76, + "eval_bleu_bleu": 0.011221915801333112, + "eval_bleu_brevity_penalty": 0.7871176894249504, + "eval_bleu_length_ratio": 0.8068566680236193, + "eval_bleu_precisions": [ + 0.18087767935627833, + 0.022751939312929133, + 0.006939607684222524, + 0.001446675129243403 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 192257, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 9.193932518263841, + "eval_chrf_word_order": 2, + "eval_loss": 4.150329113006592, + "eval_meteor": 0.08732889274005008, + "eval_runtime": 898.165, + "eval_samples_per_second": 19.148, + "eval_scarebleu_bp": 1.0, + "eval_scarebleu_counts": [ + 48798, + 5630, + 1253, + 231 + ], + "eval_scarebleu_precisions": [ + 18.280443993241953, + 2.2542903590047487, + 0.5387138797287944, + 0.10718412004621446 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.2419991577061507, + "eval_scarebleu_sys_len": 266941, + "eval_scarebleu_totals": [ + 266941, + 249746, + 232591, + 215517 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 205974, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 94.32382801588138, + "step": 4500 + }, + { + "epoch": 1.96, + "learning_rate": 4.99013028030004e-05, + "loss": 4.1476, + "step": 5000 + }, + { + "epoch": 1.96, + "eval_bleu_bleu": 0.012034312603994297, + "eval_bleu_brevity_penalty": 0.7678815320837896, + "eval_bleu_length_ratio": 0.791064256606751, + "eval_bleu_precisions": [ + 0.1967542733455707, + 0.0247343841214244, + 0.007497584039744978, + 0.0016533379947267987 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 188494, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 9.527733406518104, + "eval_chrf_word_order": 2, + "eval_loss": 4.0423665046691895, + "eval_meteor": 0.0921227509334498, + "eval_runtime": 909.7274, + "eval_samples_per_second": 18.905, + "eval_scarebleu_bp": 0.953183258545739, + "eval_scarebleu_counts": [ + 49996, + 5820, + 1317, + 266 + ], + "eval_scarebleu_precisions": [ + 20.899852435236625, + 2.621350040311139, + 0.6428058940956546, + 0.14157973174366617 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.4243400930990766, + "eval_scarebleu_sys_len": 239217, + "eval_scarebleu_totals": [ + 239217, + 222023, + 204883, + 187880 + ], + "eval_steps_per_second": 0.591, + "eval_ter_num_edits": 202928, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 92.9289413790419, + "step": 5000 + }, + { + "epoch": 2.15, + "learning_rate": 4.98519542045006e-05, + "loss": 4.0856, + "step": 5500 + }, + { + "epoch": 2.15, + "eval_bleu_bleu": 0.012492220680183533, + "eval_bleu_brevity_penalty": 0.7201552949550095, + "eval_bleu_length_ratio": 0.7528485514879616, + "eval_bleu_precisions": [ + 0.20437264476999575, + 0.027559249303312043, + 0.008346946230778245, + 0.0019259109090767324 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 179388, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 9.87133389958056, + "eval_chrf_word_order": 2, + "eval_loss": 3.9707274436950684, + "eval_meteor": 0.0939261362821297, + "eval_runtime": 925.4872, + "eval_samples_per_second": 18.583, + "eval_scarebleu_bp": 0.9520301458378654, + "eval_scarebleu_counts": [ + 50371, + 6198, + 1433, + 297 + ], + "eval_scarebleu_precisions": [ + 21.080936298081955, + 2.795052063368944, + 0.7003773142265058, + 0.15831472113688094 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.5220677797630346, + "eval_scarebleu_sys_len": 238941, + "eval_scarebleu_totals": [ + 238941, + 221749, + 204604, + 187601 + ], + "eval_steps_per_second": 0.581, + "eval_ter_num_edits": 201820, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 92.4215433509335, + "step": 5500 + }, + { + "epoch": 2.35, + "learning_rate": 4.980260560600079e-05, + "loss": 3.9932, + "step": 6000 + }, + { + "epoch": 2.35, + "eval_bleu_bleu": 0.012810802247874219, + "eval_bleu_brevity_penalty": 0.7684221434938174, + "eval_bleu_length_ratio": 0.7915049165054411, + "eval_bleu_precisions": [ + 0.20240828424328866, + 0.026796340808849267, + 0.007953278539759912, + 0.0017908361603307952 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 188599, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 10.768086144078948, + "eval_chrf_word_order": 2, + "eval_loss": 3.9121487140655518, + "eval_meteor": 0.09866190439618464, + "eval_runtime": 913.3421, + "eval_samples_per_second": 18.83, + "eval_scarebleu_bp": 0.9691698122333106, + "eval_scarebleu_counts": [ + 51603, + 6362, + 1472, + 296 + ], + "eval_scarebleu_precisions": [ + 21.22925023141006, + 2.8165397556224545, + 0.7052172663249173, + 0.15440631813961253 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.5481374436861277, + "eval_scarebleu_sys_len": 243075, + "eval_scarebleu_totals": [ + 243075, + 225880, + 208730, + 191702 + ], + "eval_steps_per_second": 0.589, + "eval_ter_num_edits": 201491, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 92.27088094006018, + "step": 6000 + }, + { + "epoch": 2.55, + "learning_rate": 4.975325700750099e-05, + "loss": 3.9638, + "step": 6500 + }, + { + "epoch": 2.55, + "eval_bleu_bleu": 0.013649772527377455, + "eval_bleu_brevity_penalty": 0.7605589943270334, + "eval_bleu_length_ratio": 0.7851132495939633, + "eval_bleu_precisions": [ + 0.21057751929697022, + 0.028660058391410812, + 0.008463371210137719, + 0.0020311292637156418 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 187076, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 11.066856948890994, + "eval_chrf_word_order": 2, + "eval_loss": 3.8658156394958496, + "eval_meteor": 0.10154066669781668, + "eval_runtime": 898.3145, + "eval_samples_per_second": 19.145, + "eval_scarebleu_bp": 0.9138312391382774, + "eval_scarebleu_counts": [ + 52220, + 6731, + 1569, + 331 + ], + "eval_scarebleu_precisions": [ + 22.707803361381078, + 3.1634058192379815, + 0.8019627386337499, + 0.18527744037257 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.6517438249364063, + "eval_scarebleu_sys_len": 229965, + "eval_scarebleu_totals": [ + 229965, + 212777, + 195645, + 178651 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 200268, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 91.71081975921491, + "step": 6500 + }, + { + "epoch": 2.74, + "learning_rate": 4.970390840900119e-05, + "loss": 3.9265, + "step": 7000 + }, + { + "epoch": 2.74, + "eval_bleu_bleu": 0.013652962355308272, + "eval_bleu_brevity_penalty": 0.7864172690870728, + "eval_bleu_length_ratio": 0.8062775150139123, + "eval_bleu_precisions": [ + 0.20498232866088206, + 0.028531738772523553, + 0.008225862669919832, + 0.0018882925859670045 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 192119, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 11.526476342650843, + "eval_chrf_word_order": 2, + "eval_loss": 3.825770139694214, + "eval_meteor": 0.10311187398374413, + "eval_runtime": 898.7517, + "eval_samples_per_second": 19.135, + "eval_scarebleu_bp": 0.966786226489416, + "eval_scarebleu_counts": [ + 52763, + 6952, + 1596, + 330 + ], + "eval_scarebleu_precisions": [ + 21.758297044074954, + 3.085595082221877, + 0.7667400098004362, + 0.1726555469518448 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.6692776503053472, + "eval_scarebleu_sys_len": 242496, + "eval_scarebleu_totals": [ + 242496, + 225305, + 208154, + 191132 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 200560, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 91.84453837312073, + "step": 7000 + }, + { + "epoch": 2.94, + "learning_rate": 4.9654559810501384e-05, + "loss": 3.8679, + "step": 7500 + }, + { + "epoch": 2.94, + "eval_bleu_bleu": 0.0142128995216716, + "eval_bleu_brevity_penalty": 0.7885731364466368, + "eval_bleu_length_ratio": 0.8080611384133726, + "eval_bleu_precisions": [ + 0.21041424297822836, + 0.02963634601018482, + 0.00860134866113467, + 0.0019674173047798333 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 192544, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 11.689091771943092, + "eval_chrf_word_order": 2, + "eval_loss": 3.7899129390716553, + "eval_meteor": 0.10594887815472302, + "eval_runtime": 920.6525, + "eval_samples_per_second": 18.68, + "eval_scarebleu_bp": 0.9422575671571348, + "eval_scarebleu_counts": [ + 53549, + 7131, + 1661, + 343 + ], + "eval_scarebleu_precisions": [ + 22.63137430583144, + 3.249798340237617, + 0.8211187186395432, + 0.18513920525082853 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.7230090393206174, + "eval_scarebleu_sys_len": 236614, + "eval_scarebleu_totals": [ + 236614, + 219429, + 202285, + 185266 + ], + "eval_steps_per_second": 0.584, + "eval_ter_num_edits": 199706, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 91.45345722149206, + "step": 7500 + }, + { + "epoch": 3.13, + "learning_rate": 4.960521121200158e-05, + "loss": 3.8253, + "step": 8000 + }, + { + "epoch": 3.13, + "eval_bleu_bleu": 0.014506178068679876, + "eval_bleu_brevity_penalty": 0.7796727551084742, + "eval_bleu_length_ratio": 0.8007168067685361, + "eval_bleu_precisions": [ + 0.21547847416585428, + 0.030898261540765658, + 0.008876647196410997, + 0.002027569209606236 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 190794, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 11.948708760062607, + "eval_chrf_word_order": 2, + "eval_loss": 3.7546181678771973, + "eval_meteor": 0.10781681918079293, + "eval_runtime": 904.137, + "eval_samples_per_second": 19.021, + "eval_scarebleu_bp": 0.9517374883175079, + "eval_scarebleu_counts": [ + 54775, + 7460, + 1753, + 361 + ], + "eval_scarebleu_precisions": [ + 22.930786910089545, + 3.3652262956797894, + 0.8570953610263632, + 0.19253333333333333 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.7978740041619092, + "eval_scarebleu_sys_len": 238871, + "eval_scarebleu_totals": [ + 238871, + 221679, + 204528, + 187500 + ], + "eval_steps_per_second": 0.595, + "eval_ter_num_edits": 198990, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 91.12557185314766, + "step": 8000 + }, + { + "epoch": 3.33, + "learning_rate": 4.955586261350178e-05, + "loss": 3.8025, + "step": 8500 + }, + { + "epoch": 3.33, + "eval_bleu_bleu": 0.01520281415151016, + "eval_bleu_brevity_penalty": 0.7891811955804295, + "eval_bleu_length_ratio": 0.8085647497261613, + "eval_bleu_precisions": [ + 0.2209909479715982, + 0.03202110805912992, + 0.009144358347700332, + 0.0021282613306936294 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 192664, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 12.378501866787927, + "eval_chrf_word_order": 2, + "eval_loss": 3.7166264057159424, + "eval_meteor": 0.11112579471209312, + "eval_runtime": 900.1687, + "eval_samples_per_second": 19.105, + "eval_scarebleu_bp": 0.9444029215734185, + "eval_scarebleu_counts": [ + 55814, + 7578, + 1770, + 382 + ], + "eval_scarebleu_precisions": [ + 23.537995048983017, + 3.4455321296553105, + 0.8728499289884804, + 0.20564943769414223 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.8447203621190398, + "eval_scarebleu_sys_len": 237123, + "eval_scarebleu_totals": [ + 237123, + 219937, + 202784, + 185753 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 198179, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 90.75418214123799, + "step": 8500 + }, + { + "epoch": 3.53, + "learning_rate": 4.950651401500197e-05, + "loss": 3.773, + "step": 9000 + }, + { + "epoch": 3.53, + "eval_bleu_bleu": 0.015648557295457687, + "eval_bleu_brevity_penalty": 0.8411648027173251, + "eval_bleu_length_ratio": 0.8525384108545025, + "eval_bleu_precisions": [ + 0.2198954425968042, + 0.031664255637237765, + 0.00873711645539628, + 0.001968879845650356 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 203142, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 12.727405120743501, + "eval_chrf_word_order": 2, + "eval_loss": 3.687321424484253, + "eval_meteor": 0.11597399678187685, + "eval_runtime": 903.2015, + "eval_samples_per_second": 19.041, + "eval_scarebleu_bp": 0.9492424142214005, + "eval_scarebleu_counts": [ + 57026, + 7904, + 1860, + 394 + ], + "eval_scarebleu_precisions": [ + 23.932850697723218, + 3.5751117222413202, + 0.9120642563979346, + 0.2108079186730872 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.9117285972562006, + "eval_scarebleu_sys_len": 238275, + "eval_scarebleu_totals": [ + 238275, + 221084, + 203933, + 186900 + ], + "eval_steps_per_second": 0.596, + "eval_ter_num_edits": 197943, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 90.64610819301274, + "step": 9000 + }, + { + "epoch": 3.72, + "learning_rate": 4.945716541650217e-05, + "loss": 3.7521, + "step": 9500 + }, + { + "epoch": 3.72, + "eval_bleu_bleu": 0.015458530197767956, + "eval_bleu_brevity_penalty": 0.7785290655033739, + "eval_bleu_length_ratio": 0.799776732317997, + "eval_bleu_precisions": [ + 0.22124678595791572, + 0.03322682600470632, + 0.009535572806338277, + 0.002217485844689875 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 190570, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 12.571450080415957, + "eval_chrf_word_order": 2, + "eval_loss": 3.67626953125, + "eval_meteor": 0.1124764601648934, + "eval_runtime": 884.6944, + "eval_samples_per_second": 19.439, + "eval_scarebleu_bp": 0.921140556631552, + "eval_scarebleu_counts": [ + 55280, + 7813, + 1870, + 410 + ], + "eval_scarebleu_precisions": [ + 23.862763211285603, + 3.642899772464471, + 0.9476799578358436, + 0.22736977534757075 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.9163132387685478, + "eval_scarebleu_sys_len": 231658, + "eval_scarebleu_totals": [ + 231658, + 214472, + 197324, + 180323 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 197467, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 90.42812853472792, + "step": 9500 + }, + { + "epoch": 3.92, + "learning_rate": 4.940781681800237e-05, + "loss": 3.7293, + "step": 10000 + }, + { + "epoch": 3.92, + "eval_bleu_bleu": 0.01600709306450972, + "eval_bleu_brevity_penalty": 0.7803921498574778, + "eval_bleu_length_ratio": 0.8013085500610628, + "eval_bleu_precisions": [ + 0.2247518789116715, + 0.03434800375249639, + 0.009947389927469609, + 0.002305071156544398 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 190935, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 13.009074295896673, + "eval_chrf_word_order": 2, + "eval_loss": 3.645359754562378, + "eval_meteor": 0.11533202996658069, + "eval_runtime": 893.8498, + "eval_samples_per_second": 19.24, + "eval_scarebleu_bp": 0.9358972738207232, + "eval_scarebleu_counts": [ + 56283, + 8093, + 1959, + 436 + ], + "eval_scarebleu_precisions": [ + 23.93890545316893, + 3.71362887572444, + 0.975714228792286, + 0.2372763289651269 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 1.9934169319703343, + "eval_scarebleu_sys_len": 235111, + "eval_scarebleu_totals": [ + 235111, + 217927, + 200776, + 183752 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 196939, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 90.18633597259684, + "step": 10000 + }, + { + "epoch": 4.11, + "learning_rate": 4.935846821950257e-05, + "loss": 3.6993, + "step": 10500 + }, + { + "epoch": 4.11, + "eval_bleu_bleu": 0.016498035092930748, + "eval_bleu_brevity_penalty": 0.7874221007610812, + "eval_bleu_length_ratio": 0.8071084736800138, + "eval_bleu_precisions": [ + 0.2285965359276611, + 0.03548282103844638, + 0.010126454095517778, + 0.002346136671321137 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 192317, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 13.157968683776444, + "eval_chrf_word_order": 2, + "eval_loss": 3.6208066940307617, + "eval_meteor": 0.11796826909316199, + "eval_runtime": 885.4726, + "eval_samples_per_second": 19.422, + "eval_scarebleu_bp": 0.9238909352286672, + "eval_scarebleu_counts": [ + 57101, + 8409, + 2020, + 457 + ], + "eval_scarebleu_precisions": [ + 24.58092622407425, + 3.9091990999869832, + 1.0204030086734255, + 0.2525615376963293 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.060995057452842, + "eval_scarebleu_sys_len": 232298, + "eval_scarebleu_totals": [ + 232298, + 215108, + 197961, + 180946 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 196288, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 89.88821673406024, + "step": 10500 + }, + { + "epoch": 4.31, + "learning_rate": 4.9309119621002765e-05, + "loss": 3.6682, + "step": 11000 + }, + { + "epoch": 4.31, + "eval_bleu_bleu": 0.01669847704462812, + "eval_bleu_brevity_penalty": 0.7790959305591282, + "eval_bleu_length_ratio": 0.8002425727823266, + "eval_bleu_precisions": [ + 0.22830801181030097, + 0.036202772414190613, + 0.010321342925659472, + 0.002473685720021797 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 190681, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 13.203408641067638, + "eval_chrf_word_order": 2, + "eval_loss": 3.5980210304260254, + "eval_meteor": 0.11794395420402942, + "eval_runtime": 905.3196, + "eval_samples_per_second": 18.997, + "eval_scarebleu_bp": 0.935353855272948, + "eval_scarebleu_counts": [ + 57233, + 8586, + 2077, + 483 + ], + "eval_scarebleu_precisions": [ + 24.356230025150754, + 3.942203060648218, + 1.0351306497351123, + 0.2630145937704204 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.1149833789883785, + "eval_scarebleu_sys_len": 234983, + "eval_scarebleu_totals": [ + 234983, + 217797, + 200651, + 183640 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 196263, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 89.8767682225957, + "step": 11000 + }, + { + "epoch": 4.5, + "learning_rate": 4.925977102250297e-05, + "loss": 3.662, + "step": 11500 + }, + { + "epoch": 4.5, + "eval_bleu_bleu": 0.016988075857737806, + "eval_bleu_brevity_penalty": 0.7735135679447839, + "eval_bleu_length_ratio": 0.7956639065968886, + "eval_bleu_precisions": [ + 0.23425813597763595, + 0.03766328685120304, + 0.010634049569742876, + 0.0024796674498463764 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 189590, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 13.544439612658667, + "eval_chrf_word_order": 2, + "eval_loss": 3.5758237838745117, + "eval_meteor": 0.12021456762834692, + "eval_runtime": 897.6325, + "eval_samples_per_second": 19.159, + "eval_scarebleu_bp": 0.9462665659887197, + "eval_scarebleu_counts": [ + 58287, + 8860, + 2136, + 488 + ], + "eval_scarebleu_precisions": [ + 24.535076568195784, + 4.020474470440891, + 1.0511242009536885, + 0.26212601385830153 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.16058181718745, + "eval_scarebleu_sys_len": 237566, + "eval_scarebleu_totals": [ + 237566, + 220372, + 203211, + 186170 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 195759, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 89.64596623147058, + "step": 11500 + }, + { + "epoch": 4.7, + "learning_rate": 4.921042242400316e-05, + "loss": 3.6592, + "step": 12000 + }, + { + "epoch": 4.7, + "eval_bleu_bleu": 0.017698090136047593, + "eval_bleu_brevity_penalty": 0.8005238061265058, + "eval_bleu_length_ratio": 0.8180032650800112, + "eval_bleu_precisions": [ + 0.23410444659925198, + 0.03747404669063655, + 0.010629752096994153, + 0.0025617999429164142 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 194913, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 13.837216209670386, + "eval_chrf_word_order": 2, + "eval_loss": 3.5561466217041016, + "eval_meteor": 0.1227589138731498, + "eval_runtime": 889.8677, + "eval_samples_per_second": 19.326, + "eval_scarebleu_bp": 0.9199953770133047, + "eval_scarebleu_counts": [ + 58611, + 8839, + 2164, + 515 + ], + "eval_scarebleu_precisions": [ + 25.329743465634074, + 4.126478744362798, + 1.0982374405586597, + 0.28607296804870463 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.2023255273471634, + "eval_scarebleu_sys_len": 231392, + "eval_scarebleu_totals": [ + 231392, + 214202, + 197043, + 180024 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 195464, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 89.51087379618902, + "step": 12000 + }, + { + "epoch": 4.9, + "learning_rate": 4.9161073825503354e-05, + "loss": 3.6142, + "step": 12500 + }, + { + "epoch": 4.9, + "eval_bleu_bleu": 0.01816699537237565, + "eval_bleu_brevity_penalty": 0.8089954428086782, + "eval_bleu_length_ratio": 0.8251083813512731, + "eval_bleu_precisions": [ + 0.23060333865700944, + 0.03785678852702981, + 0.010882894874686485, + 0.0026766668960297255 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 196606, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 14.002358899592915, + "eval_chrf_word_order": 2, + "eval_loss": 3.5401859283447266, + "eval_meteor": 0.12349231367248499, + "eval_runtime": 878.8045, + "eval_samples_per_second": 19.57, + "eval_scarebleu_bp": 0.9303226530233286, + "eval_scarebleu_counts": [ + 58455, + 9098, + 2252, + 550 + ], + "eval_scarebleu_precisions": [ + 25.00203164229409, + 4.200214211848131, + 1.1290880558327023, + 0.30148880654285526 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.2748094964301733, + "eval_scarebleu_sys_len": 233801, + "eval_scarebleu_totals": [ + 233801, + 216608, + 199453, + 182428 + ], + "eval_steps_per_second": 0.612, + "eval_ter_num_edits": 195463, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 89.51041585573044, + "step": 12500 + }, + { + "epoch": 5.09, + "learning_rate": 4.911172522700356e-05, + "loss": 3.6046, + "step": 13000 + }, + { + "epoch": 5.09, + "eval_bleu_bleu": 0.01837209272399148, + "eval_bleu_brevity_penalty": 0.789814283207778, + "eval_bleu_length_ratio": 0.8090893448436497, + "eval_bleu_precisions": [ + 0.23661100996426146, + 0.03908972869541447, + 0.011144627734093979, + 0.0028403470593222732 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 192789, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 14.101331254298541, + "eval_chrf_word_order": 2, + "eval_loss": 3.518184185028076, + "eval_meteor": 0.12390292106368213, + "eval_runtime": 913.311, + "eval_samples_per_second": 18.83, + "eval_scarebleu_bp": 0.9306937752512372, + "eval_scarebleu_counts": [ + 59237, + 9255, + 2266, + 558 + ], + "eval_scarebleu_precisions": [ + 25.32707962785607, + 4.2709799487759295, + 1.1356175985646917, + 0.3057333216446042 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.303979940107864, + "eval_scarebleu_sys_len": 233888, + "eval_scarebleu_totals": [ + 233888, + 216695, + 199539, + 182512 + ], + "eval_steps_per_second": 0.589, + "eval_ter_num_edits": 194864, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 89.23610952104008, + "step": 13000 + }, + { + "epoch": 5.29, + "learning_rate": 4.9062376628503753e-05, + "loss": 3.5736, + "step": 13500 + }, + { + "epoch": 5.29, + "eval_bleu_bleu": 0.019068739786263344, + "eval_bleu_brevity_penalty": 0.8173503483952447, + "eval_bleu_length_ratio": 0.8321631364912561, + "eval_bleu_precisions": [ + 0.23633924563889716, + 0.03981379733065331, + 0.01125966769951448, + 0.0027961466242142218 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 198287, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 14.484905865947745, + "eval_chrf_word_order": 2, + "eval_loss": 3.499253034591675, + "eval_meteor": 0.12740758869283744, + "eval_runtime": 884.4893, + "eval_samples_per_second": 19.444, + "eval_scarebleu_bp": 0.9298745762234788, + "eval_scarebleu_counts": [ + 59680, + 9498, + 2362, + 576 + ], + "eval_scarebleu_precisions": [ + 25.537450362864575, + 4.38702644779263, + 1.1848983154578563, + 0.3159436347779344 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.366377317850796, + "eval_scarebleu_sys_len": 233696, + "eval_scarebleu_totals": [ + 233696, + 216502, + 199342, + 182311 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 194591, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 89.11109177584731, + "step": 13500 + }, + { + "epoch": 5.48, + "learning_rate": 4.901302803000395e-05, + "loss": 3.5641, + "step": 14000 + }, + { + "epoch": 5.48, + "eval_bleu_bleu": 0.018724923648157928, + "eval_bleu_brevity_penalty": 0.7831639440991308, + "eval_bleu_length_ratio": 0.8035915880123721, + "eval_bleu_precisions": [ + 0.23494482423660035, + 0.04076105666613114, + 0.011696725171505301, + 0.0029173859080987774 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 191479, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 14.233889118159285, + "eval_chrf_word_order": 2, + "eval_loss": 3.4971816539764404, + "eval_meteor": 0.12440605757078775, + "eval_runtime": 878.636, + "eval_samples_per_second": 19.574, + "eval_scarebleu_bp": 0.9331816720769291, + "eval_scarebleu_counts": [ + 58799, + 9613, + 2375, + 590 + ], + "eval_scarebleu_precisions": [ + 25.0771947183459, + 4.424306300252673, + 1.1868235105989586, + 0.3222740531151338 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.3817715624229914, + "eval_scarebleu_sys_len": 234472, + "eval_scarebleu_totals": [ + 234472, + 217277, + 200114, + 183074 + ], + "eval_steps_per_second": 0.612, + "eval_ter_num_edits": 194656, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 89.1408579056551, + "step": 14000 + }, + { + "epoch": 5.68, + "learning_rate": 4.896367943150415e-05, + "loss": 3.5484, + "step": 14500 + }, + { + "epoch": 5.68, + "eval_bleu_bleu": 0.01918221541521584, + "eval_bleu_brevity_penalty": 0.8072038258863783, + "eval_bleu_length_ratio": 0.8236017441738466, + "eval_bleu_precisions": [ + 0.23617685875452873, + 0.04040657898411103, + 0.01150646350727878, + 0.0029042294134284394 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 196247, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 14.532918637152195, + "eval_chrf_word_order": 2, + "eval_loss": 3.469637155532837, + "eval_meteor": 0.12715430747019119, + "eval_runtime": 897.3111, + "eval_samples_per_second": 19.166, + "eval_scarebleu_bp": 0.9465985640965462, + "eval_scarebleu_counts": [ + 60151, + 9784, + 2429, + 611 + ], + "eval_scarebleu_precisions": [ + 25.311283637358244, + 4.438134205476905, + 1.1948330480294356, + 0.32804840727397677 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.438404671265055, + "eval_scarebleu_sys_len": 237645, + "eval_scarebleu_totals": [ + 237645, + 220453, + 203292, + 186253 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 194487, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 89.06346596815482, + "step": 14500 + }, + { + "epoch": 5.88, + "learning_rate": 4.891433083300435e-05, + "loss": 3.5408, + "step": 15000 + }, + { + "epoch": 5.88, + "eval_bleu_bleu": 0.019699437876944354, + "eval_bleu_brevity_penalty": 0.8339303450240936, + "eval_bleu_length_ratio": 0.8463062208587412, + "eval_bleu_precisions": [ + 0.23953544880663702, + 0.04014289896241042, + 0.011403230915426037, + 0.0028398132506883386 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 201657, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 14.94538481809081, + "eval_chrf_word_order": 2, + "eval_loss": 3.453136920928955, + "eval_meteor": 0.1314418432131532, + "eval_runtime": 877.4288, + "eval_samples_per_second": 19.6, + "eval_scarebleu_bp": 0.921695491273367, + "eval_scarebleu_counts": [ + 60784, + 9712, + 2414, + 602 + ], + "eval_scarebleu_precisions": [ + 26.224076414984445, + 4.525713433614793, + 1.2226746895196419, + 0.33369548347043304 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.43136179902878, + "eval_scarebleu_sys_len": 231787, + "eval_scarebleu_totals": [ + 231787, + 214596, + 197436, + 180404 + ], + "eval_steps_per_second": 0.613, + "eval_ter_num_edits": 193892, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 88.79099139529878, + "step": 15000 + }, + { + "epoch": 6.07, + "learning_rate": 4.886508093170154e-05, + "loss": 3.4962, + "step": 15500 + }, + { + "epoch": 6.07, + "eval_bleu_bleu": 0.02039521285853284, + "eval_bleu_brevity_penalty": 0.8164633659123893, + "eval_bleu_length_ratio": 0.8314119162830128, + "eval_bleu_precisions": [ + 0.24278171502412826, + 0.042152392007296244, + 0.012169283093061738, + 0.0031265326140264837 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 198108, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 15.13089261782855, + "eval_chrf_word_order": 2, + "eval_loss": 3.4371795654296875, + "eval_meteor": 0.13265166421690444, + "eval_runtime": 881.067, + "eval_samples_per_second": 19.52, + "eval_scarebleu_bp": 0.9203097757883734, + "eval_scarebleu_counts": [ + 61139, + 10108, + 2537, + 651 + ], + "eval_scarebleu_precisions": [ + 26.413928671721425, + 4.717368578255675, + 1.2870985744000811, + 0.3615280809023208 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.5395437508955796, + "eval_scarebleu_sys_len": 231465, + "eval_scarebleu_totals": [ + 231465, + 214272, + 197110, + 180069 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 193570, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 88.64353456763551, + "step": 15500 + }, + { + "epoch": 6.27, + "learning_rate": 4.881573233320174e-05, + "loss": 3.4933, + "step": 16000 + }, + { + "epoch": 6.27, + "eval_bleu_bleu": 0.020373188541894956, + "eval_bleu_brevity_penalty": 0.8228560956703361, + "eval_bleu_length_ratio": 0.8368383281783119, + "eval_bleu_precisions": [ + 0.24148825733070547, + 0.042429531085353, + 0.011965345934811583, + 0.0030651444466199018 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 199401, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 15.158102362555281, + "eval_chrf_word_order": 2, + "eval_loss": 3.423179864883423, + "eval_meteor": 0.13234960450483618, + "eval_runtime": 885.5598, + "eval_samples_per_second": 19.42, + "eval_scarebleu_bp": 0.9518921888779303, + "eval_scarebleu_counts": [ + 61911, + 10296, + 2531, + 642 + ], + "eval_scarebleu_precisions": [ + 25.914159425385503, + 4.643799472295514, + 1.2373623794903885, + 0.3424091309101576 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.543612615878307, + "eval_scarebleu_sys_len": 238908, + "eval_scarebleu_totals": [ + 238908, + 221715, + 204548, + 187495 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 193419, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 88.57438555838971, + "step": 16000 + }, + { + "epoch": 6.46, + "learning_rate": 4.876638373470194e-05, + "loss": 3.4744, + "step": 16500 + }, + { + "epoch": 6.46, + "eval_bleu_bleu": 0.02046442353337142, + "eval_bleu_brevity_penalty": 0.8016479771043586, + "eval_bleu_length_ratio": 0.8189433395305503, + "eval_bleu_precisions": [ + 0.24500735380783756, + 0.04359798588319921, + 0.012568486122426134, + 0.003163258921432991 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 195137, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 15.169659491612473, + "eval_chrf_word_order": 2, + "eval_loss": 3.412996768951416, + "eval_meteor": 0.13241206884557213, + "eval_runtime": 884.7669, + "eval_samples_per_second": 19.438, + "eval_scarebleu_bp": 0.9345212101171294, + "eval_scarebleu_counts": [ + 61644, + 10438, + 2635, + 672 + ], + "eval_scarebleu_precisions": [ + 26.25528670667456, + 4.79700727042106, + 1.314666892845917, + 0.3664541741420773 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.608223466159479, + "eval_scarebleu_sys_len": 234787, + "eval_scarebleu_totals": [ + 234787, + 217594, + 200431, + 183379 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 193207, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 88.4773021811704, + "step": 16500 + }, + { + "epoch": 6.66, + "learning_rate": 4.8717035136202136e-05, + "loss": 3.4825, + "step": 17000 + }, + { + "epoch": 6.66, + "eval_bleu_bleu": 0.02093234302488353, + "eval_bleu_brevity_penalty": 0.8329086544280248, + "eval_bleu_length_ratio": 0.8454290978223008, + "eval_bleu_precisions": [ + 0.24358643421627418, + 0.043391188251001335, + 0.012345235744334536, + 0.003057228113177386 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 201448, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 15.546373665292851, + "eval_chrf_word_order": 2, + "eval_loss": 3.3973846435546875, + "eval_meteor": 0.13559044246354832, + "eval_runtime": 903.9168, + "eval_samples_per_second": 19.026, + "eval_scarebleu_bp": 0.935005582574756, + "eval_scarebleu_counts": [ + 62212, + 10629, + 2691, + 669 + ], + "eval_scarebleu_precisions": [ + 26.484348725633353, + 4.882249996555003, + 1.3418167131224787, + 0.36455580319435893 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.6368221304281114, + "eval_scarebleu_sys_len": 234901, + "eval_scarebleu_totals": [ + 234901, + 217707, + 200549, + 183511 + ], + "eval_steps_per_second": 0.595, + "eval_ter_num_edits": 193099, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 88.4278446116436, + "step": 17000 + }, + { + "epoch": 6.85, + "learning_rate": 4.8667785234899334e-05, + "loss": 3.4531, + "step": 17500 + }, + { + "epoch": 6.85, + "eval_bleu_bleu": 0.021475531373427198, + "eval_bleu_brevity_penalty": 0.8293332686037754, + "eval_bleu_length_ratio": 0.8423654623361689, + "eval_bleu_precisions": [ + 0.24584740780597655, + 0.043934068927938975, + 0.012718104064864734, + 0.0032731800048194063 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 200718, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 15.584352304811599, + "eval_chrf_word_order": 2, + "eval_loss": 3.3813438415527344, + "eval_meteor": 0.13608827861097164, + "eval_runtime": 880.1349, + "eval_samples_per_second": 19.54, + "eval_scarebleu_bp": 0.9406699968121972, + "eval_scarebleu_counts": [ + 62801, + 10723, + 2706, + 689 + ], + "eval_scarebleu_precisions": [ + 26.583784149882746, + 4.895341139948412, + 1.3404068773869495, + 0.37278910092358636 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.671235616119071, + "eval_scarebleu_sys_len": 236238, + "eval_scarebleu_totals": [ + 236238, + 219045, + 201879, + 184823 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 192797, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 88.28954659315195, + "step": 17500 + }, + { + "epoch": 7.05, + "learning_rate": 4.861843663639953e-05, + "loss": 3.4446, + "step": 18000 + }, + { + "epoch": 7.05, + "eval_bleu_bleu": 0.021441395564061137, + "eval_bleu_brevity_penalty": 0.8348144584740955, + "eval_bleu_length_ratio": 0.8470658345888643, + "eval_bleu_precisions": [ + 0.24267481841873184, + 0.04404668417774649, + 0.012662459776839817, + 0.003215113691468656 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 201838, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 15.920046243497527, + "eval_chrf_word_order": 2, + "eval_loss": 3.3755526542663574, + "eval_meteor": 0.13568028452387781, + "eval_runtime": 913.7448, + "eval_samples_per_second": 18.821, + "eval_scarebleu_bp": 0.9361816093430438, + "eval_scarebleu_counts": [ + 62169, + 10760, + 2752, + 700 + ], + "eval_scarebleu_precisions": [ + 26.434870608645365, + 4.936119457760855, + 1.370340493760768, + 0.38086739829480226 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.689375168974736, + "eval_scarebleu_sys_len": 235178, + "eval_scarebleu_totals": [ + 235178, + 217985, + 200826, + 183791 + ], + "eval_steps_per_second": 0.589, + "eval_ter_num_edits": 193006, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 88.38525614899551, + "step": 18000 + }, + { + "epoch": 7.25, + "learning_rate": 4.8569088037899726e-05, + "loss": 3.4153, + "step": 18500 + }, + { + "epoch": 7.25, + "eval_bleu_bleu": 0.021439525626415767, + "eval_bleu_brevity_penalty": 0.8255209769203626, + "eval_bleu_length_ratio": 0.8391087758468014, + "eval_bleu_precisions": [ + 0.24723669864260636, + 0.04461334734169457, + 0.012771662006871938, + 0.0032294091526837735 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 199942, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 15.79750190123746, + "eval_chrf_word_order": 2, + "eval_loss": 3.3561465740203857, + "eval_meteor": 0.137741894166074, + "eval_runtime": 877.7293, + "eval_samples_per_second": 19.594, + "eval_scarebleu_bp": 0.9395116019665049, + "eval_scarebleu_counts": [ + 62993, + 10872, + 2733, + 691 + ], + "eval_scarebleu_precisions": [ + 26.696021426997337, + 4.969602779174475, + 1.3556547619047619, + 0.3744222464251074 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.6913605948100128, + "eval_scarebleu_sys_len": 235964, + "eval_scarebleu_totals": [ + 235964, + 218770, + 201600, + 184551 + ], + "eval_steps_per_second": 0.613, + "eval_ter_num_edits": 192383, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 88.09995924329918, + "step": 18500 + }, + { + "epoch": 7.44, + "learning_rate": 4.851973943939992e-05, + "loss": 3.4069, + "step": 19000 + }, + { + "epoch": 7.44, + "eval_bleu_bleu": 0.02182883379039864, + "eval_bleu_brevity_penalty": 0.8494751452504113, + "eval_bleu_length_ratio": 0.8597442493883221, + "eval_bleu_precisions": [ + 0.24552008942736223, + 0.04458500298405661, + 0.012609009283749625, + 0.0031590946099983716 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 204859, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.16336489388465, + "eval_chrf_word_order": 2, + "eval_loss": 3.343419313430786, + "eval_meteor": 0.13987079361506408, + "eval_runtime": 877.1616, + "eval_samples_per_second": 19.606, + "eval_scarebleu_bp": 0.938521316901503, + "eval_scarebleu_counts": [ + 63098, + 10971, + 2762, + 696 + ], + "eval_scarebleu_precisions": [ + 26.767064013914222, + 5.0202484727846794, + 1.3716249435111016, + 0.3776226052704396 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.7108093099873267, + "eval_scarebleu_sys_len": 235730, + "eval_scarebleu_totals": [ + 235730, + 218535, + 201367, + 184311 + ], + "eval_steps_per_second": 0.613, + "eval_ter_num_edits": 192393, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 88.104538647885, + "step": 19000 + }, + { + "epoch": 7.64, + "learning_rate": 4.847039084090012e-05, + "loss": 3.408, + "step": 19500 + }, + { + "epoch": 7.64, + "eval_bleu_bleu": 0.021761699095430267, + "eval_bleu_brevity_penalty": 0.8270551928815075, + "eval_bleu_length_ratio": 0.8404181652600523, + "eval_bleu_precisions": [ + 0.24913859398563823, + 0.04583171729642032, + 0.012946388210830847, + 0.003242481203007519 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 200254, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.082569259325737, + "eval_chrf_word_order": 2, + "eval_loss": 3.330735206604004, + "eval_meteor": 0.13926671048872225, + "eval_runtime": 893.419, + "eval_samples_per_second": 19.25, + "eval_scarebleu_bp": 0.9418820001790568, + "eval_scarebleu_counts": [ + 63512, + 11194, + 2802, + 710 + ], + "eval_scarebleu_precisions": [ + 26.85212979600465, + 5.103678441814236, + 1.3859965869463062, + 0.38353914800289546 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.7517246405824007, + "eval_scarebleu_sys_len": 236525, + "eval_scarebleu_totals": [ + 236525, + 219332, + 202165, + 185118 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 191943, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.89846544152329, + "step": 19500 + }, + { + "epoch": 7.83, + "learning_rate": 4.842114093959732e-05, + "loss": 3.3954, + "step": 20000 + }, + { + "epoch": 7.83, + "eval_bleu_bleu": 0.022401988797371063, + "eval_bleu_brevity_penalty": 0.8351610880497152, + "eval_bleu_length_ratio": 0.8473638046155977, + "eval_bleu_precisions": [ + 0.2525890376357666, + 0.04615709436597606, + 0.013087068090947066, + 0.0033928915270667755 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 201909, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.28928878474, + "eval_chrf_word_order": 2, + "eval_loss": 3.3119566440582275, + "eval_meteor": 0.14223875858394802, + "eval_runtime": 889.0859, + "eval_samples_per_second": 19.343, + "eval_scarebleu_bp": 0.9396850186762659, + "eval_scarebleu_counts": [ + 64476, + 11347, + 2851, + 721 + ], + "eval_scarebleu_precisions": [ + 27.319760174572572, + 5.185706516523242, + 1.4138709117508492, + 0.39055517336641227 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.7946443435223194, + "eval_scarebleu_sys_len": 236005, + "eval_scarebleu_totals": [ + 236005, + 218813, + 201645, + 184609 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 191466, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.68002784277988, + "step": 20000 + }, + { + "epoch": 8.03, + "learning_rate": 4.837179234109751e-05, + "loss": 3.3728, + "step": 20500 + }, + { + "epoch": 8.03, + "eval_bleu_bleu": 0.02251359980622517, + "eval_bleu_brevity_penalty": 0.8398818675569544, + "eval_bleu_length_ratio": 0.8514304659663672, + "eval_bleu_precisions": [ + 0.24892299805794615, + 0.046229077357230565, + 0.013255170940678067, + 0.0033848651002593086 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 202878, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.337921193444178, + "eval_chrf_word_order": 2, + "eval_loss": 3.309891939163208, + "eval_meteor": 0.14160529217700668, + "eval_runtime": 879.6804, + "eval_samples_per_second": 19.55, + "eval_scarebleu_bp": 0.9368730351139145, + "eval_scarebleu_counts": [ + 63629, + 11336, + 2919, + 746 + ], + "eval_scarebleu_precisions": [ + 27.036937890125394, + 5.196495940810554, + 1.4523905482662367, + 0.40558908280324035 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.8257919327650614, + "eval_scarebleu_sys_len": 235341, + "eval_scarebleu_totals": [ + 235341, + 218147, + 200979, + 183930 + ], + "eval_steps_per_second": 0.612, + "eval_ter_num_edits": 191794, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.83023231319463, + "step": 20500 + }, + { + "epoch": 8.23, + "learning_rate": 4.832244374259771e-05, + "loss": 3.3606, + "step": 21000 + }, + { + "epoch": 8.23, + "eval_bleu_bleu": 0.022482052192253157, + "eval_bleu_brevity_penalty": 0.8457603517133552, + "eval_bleu_length_ratio": 0.8565169402255339, + "eval_bleu_precisions": [ + 0.25040423342642953, + 0.046560155806910725, + 0.013190218383830053, + 0.003246731994056386 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 204090, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.573374566291065, + "eval_chrf_word_order": 2, + "eval_loss": 3.298384428024292, + "eval_meteor": 0.14264457653594878, + "eval_runtime": 889.5922, + "eval_samples_per_second": 19.332, + "eval_scarebleu_bp": 0.9269981806570335, + "eval_scarebleu_counts": [ + 63908, + 11331, + 2900, + 710 + ], + "eval_scarebleu_precisions": [ + 27.425618930320184, + 5.249940926002289, + 1.4597437897968943, + 0.3909218046271927 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.790925399476087, + "eval_scarebleu_sys_len": 233023, + "eval_scarebleu_totals": [ + 233023, + 215831, + 198665, + 181622 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 191453, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.67407461681832, + "step": 21000 + }, + { + "epoch": 8.42, + "learning_rate": 4.8273095144097906e-05, + "loss": 3.3366, + "step": 21500 + }, + { + "epoch": 8.42, + "eval_bleu_bleu": 0.022827351432479506, + "eval_bleu_brevity_penalty": 0.8528513005092375, + "eval_bleu_length_ratio": 0.8626861788071966, + "eval_bleu_precisions": [ + 0.25127943179606926, + 0.046764595023597304, + 0.01331550146295312, + 0.0032801763256839105 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 205560, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.67041572906627, + "eval_chrf_word_order": 2, + "eval_loss": 3.2855989933013916, + "eval_meteor": 0.14461757130265335, + "eval_runtime": 928.8464, + "eval_samples_per_second": 18.515, + "eval_scarebleu_bp": 0.9337602178263703, + "eval_scarebleu_counts": [ + 64472, + 11563, + 2968, + 739 + ], + "eval_scarebleu_precisions": [ + 27.480733819818592, + 5.318351370867964, + 1.4821029082774049, + 0.4033512539912125 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.8548095966380695, + "eval_scarebleu_sys_len": 234608, + "eval_scarebleu_totals": [ + 234608, + 217417, + 200256, + 183215 + ], + "eval_steps_per_second": 0.579, + "eval_ter_num_edits": 191539, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.71345749625634, + "step": 21500 + }, + { + "epoch": 8.62, + "learning_rate": 4.822384524279511e-05, + "loss": 3.3384, + "step": 22000 + }, + { + "epoch": 8.62, + "eval_bleu_bleu": 0.023237243484491143, + "eval_bleu_brevity_penalty": 0.8335344816330519, + "eval_bleu_length_ratio": 0.8459662832226088, + "eval_bleu_precisions": [ + 0.2545193872286383, + 0.047992754173400876, + 0.013759328358208955, + 0.0035937707972847066 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 201576, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.71530904915313, + "eval_chrf_word_order": 2, + "eval_loss": 3.271437406539917, + "eval_meteor": 0.14470863818768345, + "eval_runtime": 884.0848, + "eval_samples_per_second": 19.453, + "eval_scarebleu_bp": 0.9380046491842873, + "eval_scarebleu_counts": [ + 64864, + 11780, + 3027, + 789 + ], + "eval_scarebleu_precisions": [ + 27.530474347220807, + 5.393427161262556, + 1.5041292746191228, + 0.42833178612726175 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.9335330539178934, + "eval_scarebleu_sys_len": 235608, + "eval_scarebleu_totals": [ + 235608, + 218414, + 201246, + 184203 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 191050, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.48952461200994, + "step": 22000 + }, + { + "epoch": 8.81, + "learning_rate": 4.81744966442953e-05, + "loss": 3.3291, + "step": 22500 + }, + { + "epoch": 8.81, + "eval_bleu_bleu": 0.023596136759644382, + "eval_bleu_brevity_penalty": 0.8507284856616246, + "eval_bleu_length_ratio": 0.8608354072326978, + "eval_bleu_precisions": [ + 0.25482281017360653, + 0.048050572828811186, + 0.013689967326767458, + 0.0035306969062512193 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 205119, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.724494797531694, + "eval_chrf_word_order": 2, + "eval_loss": 3.261108160018921, + "eval_meteor": 0.14646205323147118, + "eval_runtime": 882.7574, + "eval_samples_per_second": 19.482, + "eval_scarebleu_bp": 0.9353326223794388, + "eval_scarebleu_counts": [ + 65396, + 11868, + 3044, + 782 + ], + "eval_scarebleu_precisions": [ + 27.830690532730724, + 5.449386094606632, + 1.5172736924480243, + 0.4259932124355154 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.9430702181854644, + "eval_scarebleu_sys_len": 234978, + "eval_scarebleu_totals": [ + 234978, + 217786, + 200623, + 183571 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 190706, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.33199309425788, + "step": 22500 + }, + { + "epoch": 9.01, + "learning_rate": 4.81251480457955e-05, + "loss": 3.3254, + "step": 23000 + }, + { + "epoch": 9.01, + "eval_bleu_bleu": 0.02339023037816696, + "eval_bleu_brevity_penalty": 0.8328548572372462, + "eval_bleu_length_ratio": 0.8453829334519618, + "eval_bleu_precisions": [ + 0.2589246265581795, + 0.04902711064072295, + 0.013907756386855853, + 0.0035236598102952148 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 201437, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.752894698615002, + "eval_chrf_word_order": 2, + "eval_loss": 3.250777244567871, + "eval_meteor": 0.14700242674917954, + "eval_runtime": 907.1817, + "eval_samples_per_second": 18.958, + "eval_scarebleu_bp": 0.9286232408700106, + "eval_scarebleu_counts": [ + 65563, + 12031, + 3058, + 768 + ], + "eval_scarebleu_precisions": [ + 28.09004168755329, + 5.564471742880797, + 1.5363205675041574, + 0.42197338490785813 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.946289079247736, + "eval_scarebleu_sys_len": 233403, + "eval_scarebleu_totals": [ + 233403, + 216211, + 199047, + 182002 + ], + "eval_steps_per_second": 0.593, + "eval_ter_num_edits": 190516, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.24498440712739, + "step": 23000 + }, + { + "epoch": 9.2, + "learning_rate": 4.80757994472957e-05, + "loss": 3.2912, + "step": 23500 + }, + { + "epoch": 9.2, + "eval_bleu_bleu": 0.023699725848817972, + "eval_bleu_brevity_penalty": 0.8426840728945709, + "eval_bleu_length_ratio": 0.8538519970286933, + "eval_bleu_precisions": [ + 0.25751148902705756, + 0.04871069401867252, + 0.014002140529928984, + 0.0035620399579390115 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 203455, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.838774113485186, + "eval_chrf_word_order": 2, + "eval_loss": 3.2368876934051514, + "eval_meteor": 0.1477524039924432, + "eval_runtime": 887.6733, + "eval_samples_per_second": 19.374, + "eval_scarebleu_bp": 0.9315166121121369, + "eval_scarebleu_counts": [ + 65516, + 11962, + 3098, + 793 + ], + "eval_scarebleu_precisions": [ + 27.988602235978146, + 5.515263568000221, + 1.55112504130659, + 0.4340638889497077 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.97425082874596, + "eval_scarebleu_sys_len": 234081, + "eval_scarebleu_totals": [ + 234081, + 216889, + 199726, + 182692 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 190367, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.17675127879872, + "step": 23500 + }, + { + "epoch": 9.4, + "learning_rate": 4.80265495459929e-05, + "loss": 3.2849, + "step": 24000 + }, + { + "epoch": 9.4, + "eval_bleu_bleu": 0.02332301035939624, + "eval_bleu_brevity_penalty": 0.8269077562261378, + "eval_bleu_length_ratio": 0.8402922624318551, + "eval_bleu_precisions": [ + 0.2559783042991849, + 0.0490733860745662, + 0.014075677109392426, + 0.0035792470822085232 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 200224, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 16.921102275562067, + "eval_chrf_word_order": 2, + "eval_loss": 3.239072799682617, + "eval_meteor": 0.14500952618048418, + "eval_runtime": 880.401, + "eval_samples_per_second": 19.534, + "eval_scarebleu_bp": 0.9298788445021605, + "eval_scarebleu_counts": [ + 64753, + 11976, + 3088, + 789 + ], + "eval_scarebleu_precisions": [ + 27.708100660256658, + 5.5315119743193, + 1.549065444001886, + 0.4327888275756146 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 2.9605709431596625, + "eval_scarebleu_sys_len": 233697, + "eval_scarebleu_totals": [ + 233697, + 216505, + 199346, + 182306 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 190511, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.24269470483448, + "step": 24000 + }, + { + "epoch": 9.6, + "learning_rate": 4.797720094749309e-05, + "loss": 3.2753, + "step": 24500 + }, + { + "epoch": 9.6, + "eval_bleu_bleu": 0.02395825061517041, + "eval_bleu_brevity_penalty": 0.8246842110542032, + "eval_bleu_length_ratio": 0.8383953264870173, + "eval_bleu_precisions": [ + 0.25657749834811683, + 0.049951253710742806, + 0.014550224570354296, + 0.00381975087409643 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 199772, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.06130299230221, + "eval_chrf_word_order": 2, + "eval_loss": 3.2282874584198, + "eval_meteor": 0.146292035658911, + "eval_runtime": 882.4072, + "eval_samples_per_second": 19.49, + "eval_scarebleu_bp": 0.9406995743208517, + "eval_scarebleu_counts": [ + 65236, + 12208, + 3171, + 821 + ], + "eval_scarebleu_precisions": [ + 27.613706110182225, + 5.573131371233183, + 1.5707273096527161, + 0.4442256081724526 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.028189425458713, + "eval_scarebleu_sys_len": 236245, + "eval_scarebleu_totals": [ + 236245, + 219051, + 201881, + 184816 + ], + "eval_steps_per_second": 0.61, + "eval_ter_num_edits": 190488, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 87.2321620742871, + "step": 24500 + }, + { + "epoch": 9.79, + "learning_rate": 4.792785234899329e-05, + "loss": 3.279, + "step": 25000 + }, + { + "epoch": 9.79, + "eval_bleu_bleu": 0.024333709616576157, + "eval_bleu_brevity_penalty": 0.8481432188125936, + "eval_bleu_length_ratio": 0.8585859433689079, + "eval_bleu_precisions": [ + 0.25924930223918896, + 0.0507393710409896, + 0.0144324810122121, + 0.003569051689264136 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 204583, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.146246504653025, + "eval_chrf_word_order": 2, + "eval_loss": 3.2088704109191895, + "eval_meteor": 0.1499427090347041, + "eval_runtime": 880.9019, + "eval_samples_per_second": 19.523, + "eval_scarebleu_bp": 0.940484062201761, + "eval_scarebleu_counts": [ + 66371, + 12424, + 3224, + 796 + ], + "eval_scarebleu_precisions": [ + 28.10020576305918, + 5.673059360730593, + 1.5973522795961037, + 0.43077788962128344 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.0436637701138642, + "eval_scarebleu_sys_len": 236194, + "eval_scarebleu_totals": [ + 236194, + 219000, + 201834, + 184782 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 189936, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.97937894115007, + "step": 25000 + }, + { + "epoch": 9.99, + "learning_rate": 4.7878503750493486e-05, + "loss": 3.2744, + "step": 25500 + }, + { + "epoch": 9.99, + "eval_bleu_bleu": 0.02494835044120699, + "eval_bleu_brevity_penalty": 0.849012036766723, + "eval_bleu_length_ratio": 0.859341360338091, + "eval_bleu_precisions": [ + 0.2597393083711413, + 0.05054086186030889, + 0.014574813267539356, + 0.003896984073195527 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 204763, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.343789950074843, + "eval_chrf_word_order": 2, + "eval_loss": 3.203892469406128, + "eval_meteor": 0.15081361570338334, + "eval_runtime": 879.406, + "eval_samples_per_second": 19.556, + "eval_scarebleu_bp": 0.9234659420198147, + "eval_scarebleu_counts": [ + 65891, + 12288, + 3235, + 840 + ], + "eval_scarebleu_precisions": [ + 28.376952527788664, + 5.7151627621426275, + 1.635085342862486, + 0.4645889217665441 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.076605350889404, + "eval_scarebleu_sys_len": 232199, + "eval_scarebleu_totals": [ + 232199, + 215007, + 197849, + 180805 + ], + "eval_steps_per_second": 0.612, + "eval_ter_num_edits": 189717, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.8790899807207, + "step": 25500 + }, + { + "epoch": 10.18, + "learning_rate": 4.7829253849190683e-05, + "loss": 3.2416, + "step": 26000 + }, + { + "epoch": 10.18, + "eval_bleu_bleu": 0.02502719032734151, + "eval_bleu_brevity_penalty": 0.8473945581902994, + "eval_bleu_length_ratio": 0.8579354454232223, + "eval_bleu_precisions": [ + 0.2615884321130178, + 0.05133682984927951, + 0.014703893798025763, + 0.0038532373724839667 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 204428, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.319260440788415, + "eval_chrf_word_order": 2, + "eval_loss": 3.1911606788635254, + "eval_meteor": 0.15195980518271268, + "eval_runtime": 908.044, + "eval_samples_per_second": 18.94, + "eval_scarebleu_bp": 0.9339218144867768, + "eval_scarebleu_counts": [ + 66716, + 12518, + 3267, + 842 + ], + "eval_scarebleu_precisions": [ + 28.43261764530399, + 5.756672736971837, + 1.6311511423550087, + 0.4595116733428656 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.108173865527004, + "eval_scarebleu_sys_len": 234646, + "eval_scarebleu_totals": [ + 234646, + 217452, + 200288, + 183238 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 189561, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.80765126918199, + "step": 26000 + }, + { + "epoch": 10.38, + "learning_rate": 4.777990525069088e-05, + "loss": 3.2299, + "step": 26500 + }, + { + "epoch": 10.38, + "eval_bleu_bleu": 0.024514879035625367, + "eval_bleu_brevity_penalty": 0.8279197942320671, + "eval_bleu_length_ratio": 0.8411567951854758, + "eval_bleu_precisions": [ + 0.25772588933792345, + 0.05119543328658201, + 0.014828773721221463, + 0.003928904264805465 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 200430, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.346876093212675, + "eval_chrf_word_order": 2, + "eval_loss": 3.1929519176483154, + "eval_meteor": 0.14815875525648667, + "eval_runtime": 884.8439, + "eval_samples_per_second": 19.436, + "eval_scarebleu_bp": 0.9345764566497134, + "eval_scarebleu_counts": [ + 65578, + 12570, + 3309, + 875 + ], + "eval_scarebleu_precisions": [ + 27.92930153321976, + 5.776415497520783, + 1.6508104386695734, + 0.47706281963208913 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.13770894219609, + "eval_scarebleu_sys_len": 234800, + "eval_scarebleu_totals": [ + 234800, + 217609, + 200447, + 183414 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 189733, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.88641702805802, + "step": 26500 + }, + { + "epoch": 10.58, + "learning_rate": 4.7730556652191076e-05, + "loss": 3.2332, + "step": 27000 + }, + { + "epoch": 10.58, + "eval_bleu_bleu": 0.025381468724729746, + "eval_bleu_brevity_penalty": 0.8521970537658783, + "eval_bleu_length_ratio": 0.8621154193193693, + "eval_bleu_precisions": [ + 0.2598576602539139, + 0.05097991297926484, + 0.014934009796242825, + 0.003977368578139396 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 205424, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.558082822708403, + "eval_chrf_word_order": 2, + "eval_loss": 3.178480863571167, + "eval_meteor": 0.15242715751096259, + "eval_runtime": 895.6873, + "eval_samples_per_second": 19.201, + "eval_scarebleu_bp": 0.932905050897148, + "eval_scarebleu_counts": [ + 66442, + 12592, + 3331, + 881 + ], + "eval_scarebleu_precisions": [ + 28.344716668017593, + 5.797048072407856, + 1.6650587594287514, + 0.48137341682238904 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.1603495241221156, + "eval_scarebleu_sys_len": 234407, + "eval_scarebleu_totals": [ + 234407, + 217214, + 200053, + 183018 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 189526, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.79162335313163, + "step": 27000 + }, + { + "epoch": 10.77, + "learning_rate": 4.768120805369128e-05, + "loss": 3.2233, + "step": 27500 + }, + { + "epoch": 10.77, + "eval_bleu_bleu": 0.02528720906170496, + "eval_bleu_brevity_penalty": 0.8461957156284818, + "eval_bleu_length_ratio": 0.8568946487101256, + "eval_bleu_precisions": [ + 0.25996669605250267, + 0.052207117110371896, + 0.015043924727384065, + 0.0039058155434448377 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 204180, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.771360544985313, + "eval_chrf_word_order": 2, + "eval_loss": 3.1750001907348633, + "eval_meteor": 0.152051021810062, + "eval_runtime": 891.5235, + "eval_samples_per_second": 19.291, + "eval_scarebleu_bp": 0.9335432997765213, + "eval_scarebleu_counts": [ + 66304, + 12820, + 3356, + 871 + ], + "eval_scarebleu_precisions": [ + 28.267755812020106, + 5.897967915422588, + 1.676348796435511, + 0.47557945889868686 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.1697847328426128, + "eval_scarebleu_sys_len": 234557, + "eval_scarebleu_totals": [ + 234557, + 217363, + 200197, + 183145 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 189659, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.85252943412297, + "step": 27500 + }, + { + "epoch": 10.97, + "learning_rate": 4.763195815238847e-05, + "loss": 3.2142, + "step": 28000 + }, + { + "epoch": 10.97, + "eval_bleu_bleu": 0.02595736148891558, + "eval_bleu_brevity_penalty": 0.8551670987738492, + "eval_bleu_length_ratio": 0.8647090175802316, + "eval_bleu_precisions": [ + 0.26406266683491714, + 0.05257082340481864, + 0.015235255406011403, + 0.004013624348028412 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 206042, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.73460568203948, + "eval_chrf_word_order": 2, + "eval_loss": 3.1565914154052734, + "eval_meteor": 0.15547731271698373, + "eval_runtime": 889.8681, + "eval_samples_per_second": 19.326, + "eval_scarebleu_bp": 0.9446176393086152, + "eval_scarebleu_counts": [ + 67870, + 13021, + 3433, + 897 + ], + "eval_scarebleu_precisions": [ + 28.616121497297343, + 5.919120655326345, + 1.6926255170815645, + 0.4828655405187171 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.2401850681807827, + "eval_scarebleu_sys_len": 237174, + "eval_scarebleu_totals": [ + 237174, + 219982, + 202821, + 185766 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 189133, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.61165275290907, + "step": 28000 + }, + { + "epoch": 11.16, + "learning_rate": 4.758260955388867e-05, + "loss": 3.1829, + "step": 28500 + }, + { + "epoch": 11.16, + "eval_bleu_bleu": 0.026275929266678603, + "eval_bleu_brevity_penalty": 0.8468242924648682, + "eval_bleu_length_ratio": 0.8574402276323134, + "eval_bleu_precisions": [ + 0.2654789290783613, + 0.053319580797041424, + 0.01550871041189864, + 0.004222470602845919 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 204310, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.86869148697564, + "eval_chrf_word_order": 2, + "eval_loss": 3.1434788703918457, + "eval_meteor": 0.15585251713576773, + "eval_runtime": 877.8962, + "eval_samples_per_second": 19.59, + "eval_scarebleu_bp": 0.9347931655090822, + "eval_scarebleu_counts": [ + 67769, + 13177, + 3475, + 926 + ], + "eval_scarebleu_precisions": [ + 28.85616837909994, + 6.053992961434911, + 1.7332621739846077, + 0.5048027126331512 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.28686719670227, + "eval_scarebleu_sys_len": 234851, + "eval_scarebleu_totals": [ + 234851, + 217658, + 200489, + 183438 + ], + "eval_steps_per_second": 0.613, + "eval_ter_num_edits": 188586, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.36115932206494, + "step": 28500 + }, + { + "epoch": 11.36, + "learning_rate": 4.753326095538887e-05, + "loss": 3.1779, + "step": 29000 + }, + { + "epoch": 11.36, + "eval_bleu_bleu": 0.02615967853367427, + "eval_bleu_brevity_penalty": 0.8433678399868856, + "eval_bleu_length_ratio": 0.8544437403212201, + "eval_bleu_precisions": [ + 0.26234307157311537, + 0.0537649406665093, + 0.015543857783449425, + 0.004222152181335855 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 203596, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.9777310351543, + "eval_chrf_word_order": 2, + "eval_loss": 3.149660348892212, + "eval_meteor": 0.1540284264069055, + "eval_runtime": 884.4756, + "eval_samples_per_second": 19.444, + "eval_scarebleu_bp": 0.9349121242618025, + "eval_scarebleu_counts": [ + 66996, + 13266, + 3518, + 934 + ], + "eval_scarebleu_precisions": [ + 28.523622801527594, + 6.094070844836853, + 1.7544122120654488, + 0.5090528564732556 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.3000648007197033, + "eval_scarebleu_sys_len": 234879, + "eval_scarebleu_totals": [ + 234879, + 217687, + 200523, + 183478 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 188994, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.54799902916622, + "step": 29000 + }, + { + "epoch": 11.56, + "learning_rate": 4.7483912356889066e-05, + "loss": 3.1863, + "step": 29500 + }, + { + "epoch": 11.56, + "eval_bleu_bleu": 0.026110169292201252, + "eval_bleu_brevity_penalty": 0.8273401863480527, + "eval_bleu_length_ratio": 0.8406615773945669, + "eval_bleu_precisions": [ + 0.26720316306561764, + 0.054286510012505396, + 0.01594780062538032, + 0.0042881301336769205 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 200312, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 17.779750872608467, + "eval_chrf_word_order": 2, + "eval_loss": 3.13206148147583, + "eval_meteor": 0.15470917708092552, + "eval_runtime": 894.1599, + "eval_samples_per_second": 19.234, + "eval_scarebleu_bp": 0.9303738499140336, + "eval_scarebleu_counts": [ + 67532, + 13157, + 3509, + 931 + ], + "eval_scarebleu_precisions": [ + 28.88291070214231, + 6.07371365789255, + 1.759223515138146, + 0.5103383252570878 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.295915845162185, + "eval_scarebleu_sys_len": 233813, + "eval_scarebleu_totals": [ + 233813, + 216622, + 199463, + 182428 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 188398, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.2750665158516, + "step": 29500 + }, + { + "epoch": 11.75, + "learning_rate": 4.7434662455586264e-05, + "loss": 3.1793, + "step": 30000 + }, + { + "epoch": 11.75, + "eval_bleu_bleu": 0.027204391480724923, + "eval_bleu_brevity_penalty": 0.8536637913132394, + "eval_bleu_length_ratio": 0.8633954314060408, + "eval_bleu_precisions": [ + 0.2659809749719291, + 0.05496592144694619, + 0.01620911981795373, + 0.004352162480732614 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 205729, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 18.225822566164823, + "eval_chrf_word_order": 2, + "eval_loss": 3.1263957023620605, + "eval_meteor": 0.15738074381287806, + "eval_runtime": 871.8454, + "eval_samples_per_second": 19.726, + "eval_scarebleu_bp": 0.9354345364233645, + "eval_scarebleu_counts": [ + 68036, + 13494, + 3633, + 960 + ], + "eval_scarebleu_precisions": [ + 28.951242968144953, + 6.19536472489532, + 1.8106696437471341, + 0.5228786649164756 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.3768125938029683, + "eval_scarebleu_sys_len": 235002, + "eval_scarebleu_totals": [ + 235002, + 217808, + 200644, + 183599 + ], + "eval_steps_per_second": 0.617, + "eval_ter_num_edits": 188328, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.2430106837509, + "step": 30000 + }, + { + "epoch": 11.95, + "learning_rate": 4.738531385708646e-05, + "loss": 3.1682, + "step": 30500 + }, + { + "epoch": 11.95, + "eval_bleu_bleu": 0.027344583512059265, + "eval_bleu_brevity_penalty": 0.8487321540495756, + "eval_bleu_length_ratio": 0.8590979482035764, + "eval_bleu_precisions": [ + 0.2663149410126768, + 0.05491411170544661, + 0.01640065978316379, + 0.0044922282495305655 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 204705, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 18.16894257827412, + "eval_chrf_word_order": 2, + "eval_loss": 3.1139681339263916, + "eval_meteor": 0.15768857142900694, + "eval_runtime": 901.344, + "eval_samples_per_second": 19.08, + "eval_scarebleu_bp": 0.9389276990807646, + "eval_scarebleu_counts": [ + 68222, + 13516, + 3645, + 988 + ], + "eval_scarebleu_precisions": [ + 28.92895609474782, + 6.182077646456145, + 1.8092742055573756, + 0.5357656079692423 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.406973547092888, + "eval_scarebleu_sys_len": 235826, + "eval_scarebleu_totals": [ + 235826, + 218632, + 201462, + 184409 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 188156, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.16424492487486, + "step": 30500 + }, + { + "epoch": 12.14, + "learning_rate": 4.7335965258586656e-05, + "loss": 3.1409, + "step": 31000 + }, + { + "epoch": 12.14, + "eval_bleu_bleu": 0.028221100607893054, + "eval_bleu_brevity_penalty": 0.8665636457811713, + "eval_bleu_length_ratio": 0.8747224891828487, + "eval_bleu_precisions": [ + 0.26668201969025274, + 0.055884413859460136, + 0.01658394797913651, + 0.004551154338236698 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 208428, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 18.425476984912066, + "eval_chrf_word_order": 2, + "eval_loss": 3.1044113636016846, + "eval_meteor": 0.16078819081656473, + "eval_runtime": 884.5639, + "eval_samples_per_second": 19.442, + "eval_scarebleu_bp": 0.9565808998138717, + "eval_scarebleu_counts": [ + 69191, + 13910, + 3776, + 1034 + ], + "eval_scarebleu_precisions": [ + 28.825739901346488, + 6.242202855886339, + 1.835941868323682, + 0.5482066643692177 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.509151348630738, + "eval_scarebleu_sys_len": 240032, + "eval_scarebleu_totals": [ + 240032, + 222838, + 205671, + 188615 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 187952, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 86.07082507132424, + "step": 31000 + }, + { + "epoch": 12.34, + "learning_rate": 4.728661666008686e-05, + "loss": 3.1247, + "step": 31500 + }, + { + "epoch": 12.34, + "eval_bleu_bleu": 0.02857659049084791, + "eval_bleu_brevity_penalty": 0.8585078048705035, + "eval_bleu_length_ratio": 0.8676341599553464, + "eval_bleu_precisions": [ + 0.27108092812676854, + 0.056560871124992085, + 0.016931456314058502, + 0.00472884725501676 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 206739, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 18.47157784421938, + "eval_chrf_word_order": 2, + "eval_loss": 3.0875511169433594, + "eval_meteor": 0.1617785676075214, + "eval_runtime": 882.8119, + "eval_samples_per_second": 19.481, + "eval_scarebleu_bp": 0.9347421791374203, + "eval_scarebleu_counts": [ + 69211, + 13927, + 3831, + 1072 + ], + "eval_scarebleu_precisions": [ + 29.471680598197064, + 6.398864221127693, + 1.9109138068635276, + 0.5843936370871903 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.560864382042178, + "eval_scarebleu_sys_len": 234839, + "eval_scarebleu_totals": [ + 234839, + 217648, + 200480, + 183438 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 187245, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 85.74706116710705, + "step": 31500 + }, + { + "epoch": 12.53, + "learning_rate": 4.723736675878405e-05, + "loss": 3.1286, + "step": 32000 + }, + { + "epoch": 12.53, + "eval_bleu_bleu": 0.028803996203757048, + "eval_bleu_brevity_penalty": 0.8518457270975438, + "eval_bleu_length_ratio": 0.8618090557707562, + "eval_bleu_precisions": [ + 0.27165195202360837, + 0.05744609612083398, + 0.01727354060802395, + 0.004849673117749025 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 205351, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 18.577654245319827, + "eval_chrf_word_order": 2, + "eval_loss": 3.08168363571167, + "eval_meteor": 0.16228566455187937, + "eval_runtime": 887.2123, + "eval_samples_per_second": 19.384, + "eval_scarebleu_bp": 0.9418777795705366, + "eval_scarebleu_counts": [ + 69445, + 14153, + 3872, + 1076 + ], + "eval_scarebleu_precisions": [ + 29.360656846662494, + 6.452774788904492, + 1.9152103912034861, + 0.5812477379415403 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.5893603525851834, + "eval_scarebleu_sys_len": 236524, + "eval_scarebleu_totals": [ + 236524, + 219332, + 202171, + 185119 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 187164, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 85.70996798996194, + "step": 32000 + }, + { + "epoch": 12.73, + "learning_rate": 4.7188116857481255e-05, + "loss": 3.1276, + "step": 32500 + }, + { + "epoch": 12.73, + "eval_bleu_bleu": 0.02892764859142586, + "eval_bleu_brevity_penalty": 0.8531879033134846, + "eval_bleu_length_ratio": 0.86297995207299, + "eval_bleu_precisions": [ + 0.27033506784029565, + 0.057605459649644176, + 0.017367901782326188, + 0.004886077918038311 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 205630, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 18.525666109473686, + "eval_chrf_word_order": 2, + "eval_loss": 3.0763304233551025, + "eval_meteor": 0.16157543249409256, + "eval_runtime": 885.7096, + "eval_samples_per_second": 19.417, + "eval_scarebleu_bp": 0.9328752566663009, + "eval_scarebleu_counts": [ + 69033, + 14175, + 3896, + 1083 + ], + "eval_scarebleu_precisions": [ + 29.4509385665529, + 6.5260327705829, + 1.947552063025504, + 0.5917935771544729 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.598947426798998, + "eval_scarebleu_sys_len": 234400, + "eval_scarebleu_totals": [ + 234400, + 217207, + 200046, + 183003 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 187113, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 85.68661302657429, + "step": 32500 + }, + { + "epoch": 12.93, + "learning_rate": 4.7138768258981444e-05, + "loss": 3.1204, + "step": 33000 + }, + { + "epoch": 12.93, + "eval_bleu_bleu": 0.02963695794821759, + "eval_bleu_brevity_penalty": 0.861184967147422, + "eval_bleu_length_ratio": 0.8699843460816942, + "eval_bleu_precisions": [ + 0.27075866260811676, + 0.05825140578726717, + 0.01769266795025238, + 0.0050265109986984925 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 207299, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 18.75576220524466, + "eval_chrf_word_order": 2, + "eval_loss": 3.0648138523101807, + "eval_meteor": 0.16350801492497355, + "eval_runtime": 875.7608, + "eval_samples_per_second": 19.638, + "eval_scarebleu_bp": 0.9414683007997822, + "eval_scarebleu_counts": [ + 69454, + 14351, + 3978, + 1112 + ], + "eval_scarebleu_precisions": [ + 29.376509451120217, + 6.5459438502064, + 1.9686247340030683, + 0.6010096096680395 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.656452255824203, + "eval_scarebleu_sys_len": 236427, + "eval_scarebleu_totals": [ + 236427, + 219235, + 202070, + 185022 + ], + "eval_steps_per_second": 0.614, + "eval_ter_num_edits": 186917, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 85.59685669669229, + "step": 33000 + }, + { + "epoch": 13.12, + "learning_rate": 4.708941966048164e-05, + "loss": 3.094, + "step": 33500 + }, + { + "epoch": 13.12, + "eval_bleu_bleu": 0.02970292860090122, + "eval_bleu_brevity_penalty": 0.8595602804836809, + "eval_bleu_length_ratio": 0.8685574473621259, + "eval_bleu_precisions": [ + 0.26921274262051903, + 0.058909393674314685, + 0.017802211807506706, + 0.00505053750313249 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 206959, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 18.93255020962966, + "eval_chrf_word_order": 2, + "eval_loss": 3.0691967010498047, + "eval_meteor": 0.1634356709409305, + "eval_runtime": 876.0851, + "eval_samples_per_second": 19.631, + "eval_scarebleu_bp": 0.9386356275563832, + "eval_scarebleu_counts": [ + 69094, + 14530, + 4007, + 1126 + ], + "eval_scarebleu_precisions": [ + 29.307295223471627, + 6.647938361303783, + 1.9895532318447682, + 0.610807937248435 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.6819490476359067, + "eval_scarebleu_sys_len": 235757, + "eval_scarebleu_totals": [ + 235757, + 218564, + 201402, + 184346 + ], + "eval_steps_per_second": 0.614, + "eval_ter_num_edits": 187110, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 85.68523920519854, + "step": 33500 + }, + { + "epoch": 13.32, + "learning_rate": 4.7040071061981844e-05, + "loss": 3.0833, + "step": 34000 + }, + { + "epoch": 13.32, + "eval_bleu_bleu": 0.030166356954517543, + "eval_bleu_brevity_penalty": 0.85309174091888, + "eval_bleu_length_ratio": 0.8628960168541919, + "eval_bleu_precisions": [ + 0.27482612713389426, + 0.059713295509428554, + 0.018170458990932288, + 0.005243406853372567 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 205610, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 18.703753280854755, + "eval_chrf_word_order": 2, + "eval_loss": 3.047536849975586, + "eval_meteor": 0.16477997462462426, + "eval_runtime": 877.5364, + "eval_samples_per_second": 19.598, + "eval_scarebleu_bp": 0.9297593262969455, + "eval_scarebleu_counts": [ + 69876, + 14589, + 4066, + 1155 + ], + "eval_scarebleu_precisions": [ + 29.903838335423185, + 6.739315212771855, + 2.0400278961020715, + 0.633682270063862 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.735365776511992, + "eval_scarebleu_sys_len": 233669, + "eval_scarebleu_totals": [ + 233669, + 216476, + 199311, + 182268 + ], + "eval_steps_per_second": 0.613, + "eval_ter_num_edits": 186301, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 85.31476537420605, + "step": 34000 + }, + { + "epoch": 13.51, + "learning_rate": 4.699072246348204e-05, + "loss": 3.0901, + "step": 34500 + }, + { + "epoch": 13.51, + "eval_bleu_bleu": 0.031026885630947094, + "eval_bleu_brevity_penalty": 0.8651987101314823, + "eval_bleu_length_ratio": 0.8735180187930955, + "eval_bleu_precisions": [ + 0.2753566092216334, + 0.06050338312001173, + 0.018551018177005715, + 0.00535114070502395 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 208141, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 19.11256065382046, + "eval_chrf_word_order": 2, + "eval_loss": 3.036503553390503, + "eval_meteor": 0.16759468120909937, + "eval_runtime": 884.9862, + "eval_samples_per_second": 19.433, + "eval_scarebleu_bp": 0.948483510067273, + "eval_scarebleu_counts": [ + 70898, + 15043, + 4219, + 1205 + ], + "eval_scarebleu_precisions": [ + 29.77731484203718, + 6.809837891182022, + 2.0708476290046285, + 0.6455276451901494 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.8485852336528135, + "eval_scarebleu_sys_len": 238094, + "eval_scarebleu_totals": [ + 238094, + 220901, + 203733, + 186669 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 186067, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 85.20760730689796, + "step": 34500 + }, + { + "epoch": 13.71, + "learning_rate": 4.6941373864982236e-05, + "loss": 3.0669, + "step": 35000 + }, + { + "epoch": 13.71, + "eval_bleu_bleu": 0.031599085732063825, + "eval_bleu_brevity_penalty": 0.8806224776379802, + "eval_bleu_length_ratio": 0.8872120497400107, + "eval_bleu_precisions": [ + 0.2766220128285179, + 0.060280419548012706, + 0.018525316991895174, + 0.005366737473447457 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 211404, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 19.29115365044828, + "eval_chrf_word_order": 2, + "eval_loss": 3.0196280479431152, + "eval_meteor": 0.16992759690994214, + "eval_runtime": 882.423, + "eval_samples_per_second": 19.49, + "eval_scarebleu_bp": 0.9480220305827978, + "eval_scarebleu_counts": [ + 71542, + 15045, + 4267, + 1225 + ], + "eval_scarebleu_precisions": [ + 30.061684819147505, + 6.814198171104539, + 2.0955804713705497, + 0.656628734073403 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.8844676190852114, + "eval_scarebleu_sys_len": 237984, + "eval_scarebleu_totals": [ + 237984, + 220789, + 203619, + 186559 + ], + "eval_steps_per_second": 0.61, + "eval_ter_num_edits": 185566, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.97817913714859, + "step": 35000 + }, + { + "epoch": 13.91, + "learning_rate": 4.689202526648244e-05, + "loss": 3.0656, + "step": 35500 + }, + { + "epoch": 13.91, + "eval_bleu_bleu": 0.032167056796921695, + "eval_bleu_brevity_penalty": 0.8782066103611217, + "eval_bleu_length_ratio": 0.8850549146168987, + "eval_bleu_precisions": [ + 0.28100905685428423, + 0.062040196802222024, + 0.018890581897894564, + 0.0054653713569413976 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 210890, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 19.372713862164563, + "eval_chrf_word_order": 2, + "eval_loss": 3.0071277618408203, + "eval_meteor": 0.17201757662703274, + "eval_runtime": 884.3852, + "eval_samples_per_second": 19.446, + "eval_scarebleu_bp": 0.9411304675395149, + "eval_scarebleu_counts": [ + 72215, + 15355, + 4342, + 1250 + ], + "eval_scarebleu_precisions": [ + 30.554650577329095, + 7.0064885879336, + 2.1496539364114344, + 0.6759533646254677 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.9524427629533285, + "eval_scarebleu_sys_len": 236347, + "eval_scarebleu_totals": [ + 236347, + 219154, + 201986, + 184924 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 185008, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.72264836126007, + "step": 35500 + }, + { + "epoch": 14.1, + "learning_rate": 4.684277536517963e-05, + "loss": 3.0518, + "step": 36000 + }, + { + "epoch": 14.1, + "eval_bleu_bleu": 0.03217199238697018, + "eval_bleu_brevity_penalty": 0.8681310949573734, + "eval_bleu_length_ratio": 0.8761074202930178, + "eval_bleu_precisions": [ + 0.2765546709587178, + 0.062313053010727426, + 0.01931622069455832, + 0.005666154256603102 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 208758, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 19.516055748389938, + "eval_chrf_word_order": 2, + "eval_loss": 3.011817216873169, + "eval_meteor": 0.169166064586573, + "eval_runtime": 884.0401, + "eval_samples_per_second": 19.454, + "eval_scarebleu_bp": 0.9412993975966291, + "eval_scarebleu_counts": [ + 71088, + 15427, + 4421, + 1267 + ], + "eval_scarebleu_precisions": [ + 30.072719735010807, + 7.038057611065996, + 2.188278036538947, + 0.6849129938860569 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 3.972543290376074, + "eval_scarebleu_sys_len": 236387, + "eval_scarebleu_totals": [ + 236387, + 219194, + 202031, + 184987 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 185595, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.99145941044746, + "step": 36000 + }, + { + "epoch": 14.3, + "learning_rate": 4.679342676667983e-05, + "loss": 3.0325, + "step": 36500 + }, + { + "epoch": 14.3, + "eval_bleu_bleu": 0.0323250798708925, + "eval_bleu_brevity_penalty": 0.8629647387399427, + "eval_bleu_length_ratio": 0.8715497379122793, + "eval_bleu_precisions": [ + 0.2793395354212412, + 0.0629409911801764, + 0.019430918699374612, + 0.00576271186440678 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 207672, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 19.56234828021075, + "eval_chrf_word_order": 2, + "eval_loss": 2.996340036392212, + "eval_meteor": 0.17071104693645606, + "eval_runtime": 896.3439, + "eval_samples_per_second": 19.187, + "eval_scarebleu_bp": 0.9441965831257193, + "eval_scarebleu_counts": [ + 71703, + 15633, + 4442, + 1297 + ], + "eval_scarebleu_precisions": [ + 30.244986797371286, + 7.109722487516032, + 2.191232111761717, + 0.6985587177111834 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.0217193598304455, + "eval_scarebleu_sys_len": 237074, + "eval_scarebleu_totals": [ + 237074, + 219882, + 202717, + 185668 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 184986, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.71257367117127, + "step": 36500 + }, + { + "epoch": 14.49, + "learning_rate": 4.674407816818003e-05, + "loss": 3.0366, + "step": 37000 + }, + { + "epoch": 14.49, + "eval_bleu_bleu": 0.03302145165105514, + "eval_bleu_brevity_penalty": 0.8691274556010135, + "eval_bleu_length_ratio": 0.8769887400903982, + "eval_bleu_precisions": [ + 0.2785593966540332, + 0.06377331532593222, + 0.01985992681376451, + 0.005906311061486538 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 208968, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 19.639477328259694, + "eval_chrf_word_order": 2, + "eval_loss": 2.992673873901367, + "eval_meteor": 0.17213307469030084, + "eval_runtime": 875.0232, + "eval_samples_per_second": 19.654, + "eval_scarebleu_bp": 0.9381147796960981, + "eval_scarebleu_counts": [ + 71467, + 15740, + 4557, + 1349 + ], + "eval_scarebleu_precisions": [ + 30.329663800639974, + 7.205672979641914, + 2.264111570966508, + 0.7323124026252504 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.09298419632058, + "eval_scarebleu_sys_len": 235634, + "eval_scarebleu_totals": [ + 235634, + 218439, + 201271, + 184211 + ], + "eval_steps_per_second": 0.615, + "eval_ter_num_edits": 185054, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.74371362235482, + "step": 37000 + }, + { + "epoch": 14.69, + "learning_rate": 4.6694729569680226e-05, + "loss": 3.0231, + "step": 37500 + }, + { + "epoch": 14.69, + "eval_bleu_bleu": 0.03317076201578484, + "eval_bleu_brevity_penalty": 0.868112108305403, + "eval_bleu_length_ratio": 0.8760906332492582, + "eval_bleu_precisions": [ + 0.2808664744148615, + 0.06402205064758117, + 0.019959061276210242, + 0.00593948710781916 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 208754, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 19.623767576982964, + "eval_chrf_word_order": 2, + "eval_loss": 2.9867570400238037, + "eval_meteor": 0.1726156625741791, + "eval_runtime": 885.6398, + "eval_samples_per_second": 19.419, + "eval_scarebleu_bp": 0.9451563469862228, + "eval_scarebleu_counts": [ + 72252, + 15941, + 4605, + 1372 + ], + "eval_scarebleu_precisions": [ + 30.44727815189084, + 7.2423866573984474, + 2.269121226754442, + 0.7380709021464307 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.143335930996988, + "eval_scarebleu_sys_len": 237302, + "eval_scarebleu_totals": [ + 237302, + 220107, + 202942, + 185890 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 184848, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.64937788788701, + "step": 37500 + }, + { + "epoch": 14.88, + "learning_rate": 4.664547966837742e-05, + "loss": 3.0248, + "step": 38000 + }, + { + "epoch": 14.88, + "eval_bleu_bleu": 0.03437981620102046, + "eval_bleu_brevity_penalty": 0.877081532647801, + "eval_bleu_length_ratio": 0.884051888752261, + "eval_bleu_precisions": [ + 0.281959259628485, + 0.06527065585973038, + 0.020663289904312463, + 0.006207983127342117 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 210651, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 19.887256547539568, + "eval_chrf_word_order": 2, + "eval_loss": 2.9706814289093018, + "eval_meteor": 0.17514211771946842, + "eval_runtime": 896.0598, + "eval_samples_per_second": 19.193, + "eval_scarebleu_bp": 0.9593824121130745, + "eval_scarebleu_counts": [ + 73263, + 16404, + 4804, + 1455 + ], + "eval_scarebleu_precisions": [ + 30.436715329073643, + 7.339236100236677, + 2.3281736146785432, + 0.7687065126083718 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.289907162266152, + "eval_scarebleu_sys_len": 240706, + "eval_scarebleu_totals": [ + 240706, + 223511, + 206342, + 189279 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 184077, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.29630579432063, + "step": 38000 + }, + { + "epoch": 15.08, + "learning_rate": 4.659613106987762e-05, + "loss": 2.9873, + "step": 38500 + }, + { + "epoch": 15.08, + "eval_bleu_bleu": 0.034082913568043785, + "eval_bleu_brevity_penalty": 0.8649702710414409, + "eval_bleu_length_ratio": 0.8733165742679799, + "eval_bleu_precisions": [ + 0.28413738088258617, + 0.06600348875583424, + 0.02073105456722053, + 0.006200482259731312 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 208093, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 19.86354747346183, + "eval_chrf_word_order": 2, + "eval_loss": 2.962559700012207, + "eval_meteor": 0.1751802730486169, + "eval_runtime": 889.9177, + "eval_samples_per_second": 19.325, + "eval_scarebleu_bp": 0.9426836114673405, + "eval_scarebleu_counts": [ + 72706, + 16262, + 4724, + 1408 + ], + "eval_scarebleu_precisions": [ + 30.714572376064044, + 7.407947303447051, + 2.3344880582337155, + 0.7598365919601949 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.225270442319805, + "eval_scarebleu_sys_len": 236715, + "eval_scarebleu_totals": [ + 236715, + 219521, + 202357, + 185303 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 183996, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.25921261717552, + "step": 38500 + }, + { + "epoch": 15.28, + "learning_rate": 4.6546782471377817e-05, + "loss": 2.9762, + "step": 39000 + }, + { + "epoch": 15.28, + "eval_bleu_bleu": 0.03456518440594426, + "eval_bleu_brevity_penalty": 0.8662974432839871, + "eval_bleu_length_ratio": 0.8744874705702139, + "eval_bleu_precisions": [ + 0.2844240109035763, + 0.0670886075949367, + 0.02113428719186347, + 0.0062847027660333146 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 208372, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 20.047896985935132, + "eval_chrf_word_order": 2, + "eval_loss": 2.956040382385254, + "eval_meteor": 0.17604963802463772, + "eval_runtime": 901.81, + "eval_samples_per_second": 19.071, + "eval_scarebleu_bp": 0.9485673937358009, + "eval_scarebleu_counts": [ + 73104, + 16636, + 4862, + 1446 + ], + "eval_scarebleu_precisions": [ + 30.701260740653638, + 7.53025954861897, + 2.386199111678241, + 0.774504552758436 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.312631935740174, + "eval_scarebleu_sys_len": 238114, + "eval_scarebleu_totals": [ + 238114, + 220922, + 203755, + 186700 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 183868, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.20059623847708, + "step": 39000 + }, + { + "epoch": 15.47, + "learning_rate": 4.649743387287801e-05, + "loss": 2.9957, + "step": 39500 + }, + { + "epoch": 15.47, + "eval_bleu_bleu": 0.035023715899117035, + "eval_bleu_brevity_penalty": 0.8780983875178741, + "eval_bleu_length_ratio": 0.8849583891152808, + "eval_bleu_precisions": [ + 0.28473397923809796, + 0.06683464827130406, + 0.020965631319854752, + 0.0063434753720210115 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 210867, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 20.131392423108224, + "eval_chrf_word_order": 2, + "eval_loss": 2.9500999450683594, + "eval_meteor": 0.17761180043623745, + "eval_runtime": 907.076, + "eval_samples_per_second": 18.96, + "eval_scarebleu_bp": 0.9399683461569524, + "eval_scarebleu_counts": [ + 73075, + 16527, + 4865, + 1464 + ], + "eval_scarebleu_precisions": [ + 30.95453929309702, + 7.550816211845008, + 2.411794742138739, + 0.7928212848687025 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.321870017829327, + "eval_scarebleu_sys_len": 236072, + "eval_scarebleu_totals": [ + 236072, + 218877, + 201717, + 184657 + ], + "eval_steps_per_second": 0.593, + "eval_ter_num_edits": 183441, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.00505566266274, + "step": 39500 + }, + { + "epoch": 15.67, + "learning_rate": 4.644818397157521e-05, + "loss": 2.9856, + "step": 40000 + }, + { + "epoch": 15.67, + "eval_bleu_bleu": 0.034931602049193614, + "eval_bleu_brevity_penalty": 0.8612518174468706, + "eval_bleu_length_ratio": 0.8700431007348528, + "eval_bleu_precisions": [ + 0.28507136551976964, + 0.06756259204712813, + 0.02152937163603568, + 0.0065262267126536995 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 207313, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 19.96118523920958, + "eval_chrf_word_order": 2, + "eval_loss": 2.945787191390991, + "eval_meteor": 0.17568583205559585, + "eval_runtime": 895.5463, + "eval_samples_per_second": 19.204, + "eval_scarebleu_bp": 0.9426836114673405, + "eval_scarebleu_counts": [ + 72917, + 16655, + 4939, + 1493 + ], + "eval_scarebleu_precisions": [ + 30.803709101662335, + 7.586938894507156, + 2.44072386562429, + 0.8057421948784371 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.364776853923994, + "eval_scarebleu_sys_len": 236715, + "eval_scarebleu_totals": [ + 236715, + 219522, + 202358, + 185295 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 183679, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.11404549180516, + "step": 40000 + }, + { + "epoch": 15.86, + "learning_rate": 4.639883537307541e-05, + "loss": 2.9754, + "step": 40500 + }, + { + "epoch": 15.86, + "eval_bleu_bleu": 0.03627629809343126, + "eval_bleu_brevity_penalty": 0.8704261753040108, + "eval_bleu_length_ratio": 0.8781386525879327, + "eval_bleu_precisions": [ + 0.2886992095277239, + 0.06896749233260609, + 0.022195921027804936, + 0.006826543729775256 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 209242, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 20.161244526936684, + "eval_chrf_word_order": 2, + "eval_loss": 2.9298486709594727, + "eval_meteor": 0.17948705722905844, + "eval_runtime": 913.8248, + "eval_samples_per_second": 18.82, + "eval_scarebleu_bp": 0.9422786624840854, + "eval_scarebleu_counts": [ + 73873, + 17058, + 5113, + 1572 + ], + "eval_scarebleu_precisions": [ + 31.220231680465222, + 7.773990083126732, + 2.52795933906199, + 0.8487433523202764 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.501279703692965, + "eval_scarebleu_sys_len": 236619, + "eval_scarebleu_totals": [ + 236619, + 219424, + 202258, + 185215 + ], + "eval_steps_per_second": 0.589, + "eval_ter_num_edits": 183029, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 83.81638419372713, + "step": 40500 + }, + { + "epoch": 16.06, + "learning_rate": 4.634948677457561e-05, + "loss": 2.9573, + "step": 41000 + }, + { + "epoch": 16.06, + "eval_bleu_bleu": 0.03596144402869662, + "eval_bleu_brevity_penalty": 0.8854762557739642, + "eval_bleu_length_ratio": 0.8915598940737539, + "eval_bleu_precisions": [ + 0.28155243833553, + 0.06744824477838214, + 0.021589479831102328, + 0.006635424102293536 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 212440, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 20.490820465423916, + "eval_chrf_word_order": 2, + "eval_loss": 2.9366397857666016, + "eval_meteor": 0.17797097455472946, + "eval_runtime": 916.2303, + "eval_samples_per_second": 18.77, + "eval_scarebleu_bp": 0.9483408925140456, + "eval_scarebleu_counts": [ + 72913, + 16880, + 5069, + 1562 + ], + "eval_scarebleu_precisions": [ + 30.627992942955558, + 7.64264305053743, + 2.4884878594782474, + 0.8368783686765321 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.456095334586504, + "eval_scarebleu_sys_len": 238060, + "eval_scarebleu_totals": [ + 238060, + 220866, + 203698, + 186646 + ], + "eval_steps_per_second": 0.587, + "eval_ter_num_edits": 183548, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 84.05405529173096, + "step": 41000 + }, + { + "epoch": 16.26, + "learning_rate": 4.63001381760758e-05, + "loss": 2.9339, + "step": 41500 + }, + { + "epoch": 16.26, + "eval_bleu_bleu": 0.037184521719167335, + "eval_bleu_brevity_penalty": 0.8755734148833724, + "eval_bleu_length_ratio": 0.8827089252514909, + "eval_bleu_precisions": [ + 0.29087010473967223, + 0.07062898682793473, + 0.02259928741497565, + 0.007006509638667883 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 210331, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 20.626786294078236, + "eval_chrf_word_order": 2, + "eval_loss": 2.91275691986084, + "eval_meteor": 0.18240872638212033, + "eval_runtime": 897.8606, + "eval_samples_per_second": 19.154, + "eval_scarebleu_bp": 0.9535047343719819, + "eval_scarebleu_counts": [ + 75042, + 17655, + 5284, + 1619 + ], + "eval_scarebleu_precisions": [ + 31.359749931047165, + 7.949157808004538, + 2.5784791657517068, + 0.8617523539838082 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.625756922544027, + "eval_scarebleu_sys_len": 239294, + "eval_scarebleu_totals": [ + 239294, + 222099, + 204927, + 187873 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 182417, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 83.5361246330752, + "step": 41500 + }, + { + "epoch": 16.45, + "learning_rate": 4.6250888274773e-05, + "loss": 2.9451, + "step": 42000 + }, + { + "epoch": 16.45, + "eval_bleu_bleu": 0.03704090126216514, + "eval_bleu_brevity_penalty": 0.8818050391190896, + "eval_bleu_length_ratio": 0.8882696334968672, + "eval_bleu_precisions": [ + 0.28823184790414635, + 0.07013231444865552, + 0.02240746276232749, + 0.006873580998478082 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 211656, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 20.664247962350412, + "eval_chrf_word_order": 2, + "eval_loss": 2.9043853282928467, + "eval_meteor": 0.18283611837442196, + "eval_runtime": 916.7802, + "eval_samples_per_second": 18.759, + "eval_scarebleu_bp": 0.9477828208683253, + "eval_scarebleu_counts": [ + 74321, + 17526, + 5247, + 1599 + ], + "eval_scarebleu_precisions": [ + 31.236891987878636, + 7.939945273000743, + 2.577567742822896, + 0.857299105706749 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.585807059203147, + "eval_scarebleu_sys_len": 237927, + "eval_scarebleu_totals": [ + 237927, + 220732, + 203564, + 186516 + ], + "eval_steps_per_second": 0.587, + "eval_ter_num_edits": 182439, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 83.546199323164, + "step": 42000 + }, + { + "epoch": 16.65, + "learning_rate": 4.62015396762732e-05, + "loss": 2.9329, + "step": 42500 + }, + { + "epoch": 16.65, + "eval_bleu_bleu": 0.0381028803191446, + "eval_bleu_brevity_penalty": 0.8817909682435414, + "eval_bleu_length_ratio": 0.8882570432140474, + "eval_bleu_precisions": [ + 0.2908203521802195, + 0.07157219185337935, + 0.023151150789846205, + 0.007234806905498453 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 211653, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 20.763083254978607, + "eval_chrf_word_order": 2, + "eval_loss": 2.8938395977020264, + "eval_meteor": 0.18428619317405034, + "eval_runtime": 924.8522, + "eval_samples_per_second": 18.595, + "eval_scarebleu_bp": 0.9533293961343037, + "eval_scarebleu_counts": [ + 75126, + 17888, + 5415, + 1656 + ], + "eval_scarebleu_precisions": [ + 31.400364469262534, + 8.055480500765558, + 2.642855748394276, + 0.881559124616048 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.697110161140854, + "eval_scarebleu_sys_len": 239252, + "eval_scarebleu_totals": [ + 239252, + 222060, + 204892, + 187849 + ], + "eval_steps_per_second": 0.582, + "eval_ter_num_edits": 182110, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 83.39553691229067, + "step": 42500 + }, + { + "epoch": 16.84, + "learning_rate": 4.61521910777734e-05, + "loss": 2.9337, + "step": 43000 + }, + { + "epoch": 16.84, + "eval_bleu_bleu": 0.037893228644499864, + "eval_bleu_brevity_penalty": 0.8922999034706497, + "eval_bleu_length_ratio": 0.8977039520897772, + "eval_bleu_precisions": [ + 0.2878487545814945, + 0.0708250724416654, + 0.02278916679197367, + 0.0070004059989419425 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 213904, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 21.043894932076533, + "eval_chrf_word_order": 2, + "eval_loss": 2.8929803371429443, + "eval_meteor": 0.18413148651243674, + "eval_runtime": 906.9462, + "eval_samples_per_second": 18.963, + "eval_scarebleu_bp": 0.9554565215977833, + "eval_scarebleu_counts": [ + 74910, + 17889, + 5398, + 1662 + ], + "eval_scarebleu_precisions": [ + 31.24348312076142, + 8.03754358218612, + 2.6280428432327168, + 0.8824372683734908 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.693649939622621, + "eval_scarebleu_sys_len": 239762, + "eval_scarebleu_totals": [ + 239762, + 222568, + 205400, + 188342 + ], + "eval_steps_per_second": 0.593, + "eval_ter_num_edits": 182316, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 83.48987264675847, + "step": 43000 + }, + { + "epoch": 17.04, + "learning_rate": 4.6102842479273586e-05, + "loss": 2.9164, + "step": 43500 + }, + { + "epoch": 17.04, + "eval_bleu_bleu": 0.038287985450286104, + "eval_bleu_brevity_penalty": 0.8837685593622595, + "eval_bleu_length_ratio": 0.8900280763306879, + "eval_bleu_precisions": [ + 0.2919203112106566, + 0.07276272577996716, + 0.023366773382246204, + 0.007097801609913284 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 212075, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 21.094335175974543, + "eval_chrf_word_order": 2, + "eval_loss": 2.87992000579834, + "eval_meteor": 0.18638978957132768, + "eval_runtime": 902.0525, + "eval_samples_per_second": 19.065, + "eval_scarebleu_bp": 0.9447439235212748, + "eval_scarebleu_counts": [ + 75095, + 18053, + 5475, + 1661 + ], + "eval_scarebleu_precisions": [ + 31.658403736867843, + 8.205573408360568, + 2.6991850679603036, + 0.8940008826980419 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.727224708278198, + "eval_scarebleu_sys_len": 237204, + "eval_scarebleu_totals": [ + 237204, + 220009, + 202839, + 185794 + ], + "eval_steps_per_second": 0.596, + "eval_ter_num_edits": 181350, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 83.04750216376867, + "step": 43500 + }, + { + "epoch": 17.23, + "learning_rate": 4.605359257797079e-05, + "loss": 2.881, + "step": 44000 + }, + { + "epoch": 17.23, + "eval_bleu_bleu": 0.03888933192169707, + "eval_bleu_brevity_penalty": 0.8834969620879023, + "eval_bleu_length_ratio": 0.8897846641961734, + "eval_bleu_precisions": [ + 0.295301791837447, + 0.07339995791051365, + 0.023605295150614616, + 0.007337200039828736 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 212017, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 21.12123937916932, + "eval_chrf_word_order": 2, + "eval_loss": 2.863369941711426, + "eval_meteor": 0.18789245874253865, + "eval_runtime": 912.6242, + "eval_samples_per_second": 18.845, + "eval_scarebleu_bp": 0.9504195202388059, + "eval_scarebleu_counts": [ + 76177, + 18301, + 5567, + 1721 + ], + "eval_scarebleu_precisions": [ + 31.93254414057915, + 8.267453311769861, + 2.7263422350423374, + 0.9196176186125049 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.820738559001654, + "eval_scarebleu_sys_len": 238556, + "eval_scarebleu_totals": [ + 238556, + 221362, + 204193, + 187143 + ], + "eval_steps_per_second": 0.59, + "eval_ter_num_edits": 180923, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 82.85196158795434, + "step": 44000 + }, + { + "epoch": 17.43, + "learning_rate": 4.600424397947099e-05, + "loss": 2.9064, + "step": 44500 + }, + { + "epoch": 17.43, + "eval_bleu_bleu": 0.03944762184124936, + "eval_bleu_brevity_penalty": 0.890253424712941, + "eval_bleu_length_ratio": 0.8958573772762182, + "eval_bleu_precisions": [ + 0.2921710452347937, + 0.0735979701328279, + 0.02396199132410659, + 0.007481742820487516 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 213464, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 21.29758775618743, + "eval_chrf_word_order": 2, + "eval_loss": 2.864731550216675, + "eval_meteor": 0.1882175720611228, + "eval_runtime": 900.4591, + "eval_samples_per_second": 19.099, + "eval_scarebleu_bp": 0.9455307555999646, + "eval_scarebleu_counts": [ + 75401, + 18355, + 5652, + 1759 + ], + "eval_scarebleu_precisions": [ + 31.762366728308994, + 8.335755417900415, + 2.7838524735504464, + 0.945800623722981 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.858492848977144, + "eval_scarebleu_sys_len": 237391, + "eval_scarebleu_totals": [ + 237391, + 220196, + 203028, + 185980 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 181271, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 83.01132486754072, + "step": 44500 + }, + { + "epoch": 17.63, + "learning_rate": 4.5954895380971183e-05, + "loss": 2.8819, + "step": 45000 + }, + { + "epoch": 17.63, + "eval_bleu_bleu": 0.040162362266498455, + "eval_bleu_brevity_penalty": 0.8842975188369437, + "eval_bleu_length_ratio": 0.8905023103168974, + "eval_bleu_precisions": [ + 0.2993383226195638, + 0.07586387273454567, + 0.024583342704842446, + 0.007621581633604585 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 212188, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 21.334558116852744, + "eval_chrf_word_order": 2, + "eval_loss": 2.8460006713867188, + "eval_meteor": 0.19133670825226476, + "eval_runtime": 928.8085, + "eval_samples_per_second": 18.516, + "eval_scarebleu_bp": 0.9344064582060225, + "eval_scarebleu_counts": [ + 76228, + 18690, + 5739, + 1776 + ], + "eval_scarebleu_precisions": [ + 32.47060828079741, + 8.590496676870467, + 2.863743874811629, + 0.9685652581749962 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 4.928091595366345, + "eval_scarebleu_sys_len": 234760, + "eval_scarebleu_totals": [ + 234760, + 217566, + 200402, + 183364 + ], + "eval_steps_per_second": 0.579, + "eval_ter_num_edits": 180130, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 82.48881480429915, + "step": 45000 + }, + { + "epoch": 17.82, + "learning_rate": 4.590554678247138e-05, + "loss": 2.8804, + "step": 45500 + }, + { + "epoch": 17.82, + "eval_bleu_bleu": 0.041374526928461414, + "eval_bleu_brevity_penalty": 0.8914910598595881, + "eval_bleu_length_ratio": 0.8969737156862334, + "eval_bleu_precisions": [ + 0.29982220558648764, + 0.07664753531159686, + 0.025258381367553765, + 0.007992758486917861 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 213730, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 21.501535461869935, + "eval_chrf_word_order": 2, + "eval_loss": 2.8354275226593018, + "eval_meteor": 0.19355277816221542, + "eval_runtime": 899.8737, + "eval_samples_per_second": 19.112, + "eval_scarebleu_bp": 0.9445755412234911, + "eval_scarebleu_counts": [ + 77024, + 19039, + 5954, + 1891 + ], + "eval_scarebleu_precisions": [ + 32.47710445092847, + 8.65527117334182, + 2.935839529792312, + 1.0180185515173374 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.085377446048487, + "eval_scarebleu_sys_len": 237164, + "eval_scarebleu_totals": [ + 237164, + 219970, + 202804, + 185753 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 179863, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 82.36654470185786, + "step": 45500 + }, + { + "epoch": 18.02, + "learning_rate": 4.585639557836557e-05, + "loss": 2.891, + "step": 46000 + }, + { + "epoch": 18.02, + "eval_bleu_bleu": 0.041249611314852705, + "eval_bleu_brevity_penalty": 0.8981535438696968, + "eval_bleu_length_ratio": 0.9030044611568792, + "eval_bleu_precisions": [ + 0.2977501196744854, + 0.07627302712996217, + 0.02484252208009114, + 0.007886030982579928 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 215167, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 21.778015299513235, + "eval_chrf_word_order": 2, + "eval_loss": 2.835286855697632, + "eval_meteor": 0.1932421436782551, + "eval_runtime": 888.9907, + "eval_samples_per_second": 19.346, + "eval_scarebleu_bp": 0.9429956541885958, + "eval_scarebleu_counts": [ + 76723, + 19034, + 5876, + 1838 + ], + "eval_scarebleu_precisions": [ + 32.40142067410226, + 8.667774767185046, + 2.902817847686045, + 0.9914769662315245 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.0280919638642825, + "eval_scarebleu_sys_len": 236789, + "eval_scarebleu_totals": [ + 236789, + 219595, + 202424, + 185380 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 180129, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 82.48835686384056, + "step": 46000 + }, + { + "epoch": 18.21, + "learning_rate": 4.5807046979865775e-05, + "loss": 2.8389, + "step": 46500 + }, + { + "epoch": 18.21, + "eval_bleu_bleu": 0.04118890727280233, + "eval_bleu_brevity_penalty": 0.8909375494842335, + "eval_bleu_length_ratio": 0.8964743011343845, + "eval_bleu_precisions": [ + 0.3004433292293, + 0.07691837732160313, + 0.025158425562299178, + 0.00785698439695334 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 213611, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 21.749185153045488, + "eval_chrf_word_order": 2, + "eval_loss": 2.8244752883911133, + "eval_meteor": 0.19377640059409074, + "eval_runtime": 897.0813, + "eval_samples_per_second": 19.171, + "eval_scarebleu_bp": 0.9429577079497464, + "eval_scarebleu_counts": [ + 77174, + 19122, + 5921, + 1836 + ], + "eval_scarebleu_precisions": [ + 32.59312441929217, + 8.708245098708929, + 2.92514956747704, + 0.9904408432773019 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.049525027831522, + "eval_scarebleu_sys_len": 236780, + "eval_scarebleu_totals": [ + 236780, + 219585, + 202417, + 185372 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 179800, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 82.33769445296723, + "step": 46500 + }, + { + "epoch": 18.41, + "learning_rate": 4.575769838136597e-05, + "loss": 2.8522, + "step": 47000 + }, + { + "epoch": 18.41, + "eval_bleu_bleu": 0.04205129274568246, + "eval_bleu_brevity_penalty": 0.8942081343959478, + "eval_bleu_length_ratio": 0.8994288208360787, + "eval_bleu_precisions": [ + 0.2989804726687353, + 0.0772169237012987, + 0.02549869422681558, + 0.008307869773834506 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 214315, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 21.812190278953977, + "eval_chrf_word_order": 2, + "eval_loss": 2.8207812309265137, + "eval_meteor": 0.19358828524059268, + "eval_runtime": 900.9134, + "eval_samples_per_second": 19.09, + "eval_scarebleu_bp": 0.9504446398283646, + "eval_scarebleu_counts": [ + 77240, + 19361, + 6038, + 1916 + ], + "eval_scarebleu_precisions": [ + 32.3773274871941, + 8.746109402033726, + 2.9569484370485366, + 1.0238269540079405 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.142903545069489, + "eval_scarebleu_sys_len": 238562, + "eval_scarebleu_totals": [ + 238562, + 221367, + 204197, + 187141 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 179751, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 82.31525537049673, + "step": 47000 + }, + { + "epoch": 18.61, + "learning_rate": 4.570834978286617e-05, + "loss": 2.8548, + "step": 47500 + }, + { + "epoch": 18.61, + "eval_bleu_bleu": 0.04201930781587565, + "eval_bleu_brevity_penalty": 0.8794010841839381, + "eval_bleu_length_ratio": 0.8861208918956349, + "eval_bleu_precisions": [ + 0.30045371878907284, + 0.07853611000830116, + 0.026017658071412816, + 0.00849048340069826 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 211144, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 21.794480469154916, + "eval_chrf_word_order": 2, + "eval_loss": 2.8178658485412598, + "eval_meteor": 0.19340476149345182, + "eval_runtime": 909.1933, + "eval_samples_per_second": 18.916, + "eval_scarebleu_bp": 0.9381274863308564, + "eval_scarebleu_counts": [ + 76706, + 19358, + 6093, + 1937 + ], + "eval_scarebleu_precisions": [ + 32.55261270513544, + 8.861848911839298, + 3.0271715099092296, + 1.0513746030884468 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.164021432850503, + "eval_scarebleu_sys_len": 235637, + "eval_scarebleu_totals": [ + 235637, + 218442, + 201277, + 184235 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 179612, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 82.2516016467539, + "step": 47500 + }, + { + "epoch": 18.8, + "learning_rate": 4.565900118436637e-05, + "loss": 2.8335, + "step": 48000 + }, + { + "epoch": 18.8, + "eval_bleu_bleu": 0.043065855796435744, + "eval_bleu_brevity_penalty": 0.8923138439388211, + "eval_bleu_length_ratio": 0.8977165423725968, + "eval_bleu_precisions": [ + 0.3031925088940521, + 0.07925800154540648, + 0.02646469146803297, + 0.008531656937584195 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 213907, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 22.061868304824372, + "eval_chrf_word_order": 2, + "eval_loss": 2.7998650074005127, + "eval_meteor": 0.19729723051972853, + "eval_runtime": 912.5823, + "eval_samples_per_second": 18.845, + "eval_scarebleu_bp": 0.9423166330160688, + "eval_scarebleu_counts": [ + 77837, + 19727, + 6226, + 1981 + ], + "eval_scarebleu_precisions": [ + 32.89424751086093, + 8.989987832276823, + 3.0781552822054343, + 1.0695158294821405 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.2636385302384365, + "eval_scarebleu_sys_len": 236628, + "eval_scarebleu_totals": [ + 236628, + 219433, + 202264, + 185224 + ], + "eval_steps_per_second": 0.59, + "eval_ter_num_edits": 179059, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 81.99836057315828, + "step": 48000 + }, + { + "epoch": 19.0, + "learning_rate": 4.560975128306356e-05, + "loss": 2.8421, + "step": 48500 + }, + { + "epoch": 19.0, + "eval_bleu_bleu": 0.04352959060144077, + "eval_bleu_brevity_penalty": 0.8827005260107943, + "eval_bleu_length_ratio": 0.8890712148363893, + "eval_bleu_precisions": [ + 0.3048709681987472, + 0.08052319010336395, + 0.02692897061474671, + 0.00894598147259826 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 211847, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 22.02867227417964, + "eval_chrf_word_order": 2, + "eval_loss": 2.793745279312134, + "eval_meteor": 0.1968760547969908, + "eval_runtime": 914.7396, + "eval_samples_per_second": 18.801, + "eval_scarebleu_bp": 0.9408812466806136, + "eval_scarebleu_counts": [ + 77888, + 19896, + 6323, + 2075 + ], + "eval_scarebleu_precisions": [ + 32.96316359696642, + 9.08107515986362, + 3.13132963892892, + 1.1223071389551456 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.358416653724959, + "eval_scarebleu_sys_len": 236288, + "eval_scarebleu_totals": [ + 236288, + 219093, + 201927, + 184887 + ], + "eval_steps_per_second": 0.588, + "eval_ter_num_edits": 178706, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 81.83670759127898, + "step": 48500 + }, + { + "epoch": 19.19, + "learning_rate": 4.5560402684563765e-05, + "loss": 2.804, + "step": 49000 + }, + { + "epoch": 19.19, + "eval_bleu_bleu": 0.04323777183035401, + "eval_bleu_brevity_penalty": 0.8790673218997914, + "eval_bleu_length_ratio": 0.8858229218689015, + "eval_bleu_precisions": [ + 0.3038474840458041, + 0.08034434025521205, + 0.02714309964352402, + 0.008832716733334585 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 211073, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 22.053736084145328, + "eval_chrf_word_order": 2, + "eval_loss": 2.797565221786499, + "eval_meteor": 0.1955404063849639, + "eval_runtime": 890.3842, + "eval_samples_per_second": 19.315, + "eval_scarebleu_bp": 0.9372927623670956, + "eval_scarebleu_counts": [ + 77389, + 19774, + 6322, + 2024 + ], + "eval_scarebleu_precisions": [ + 32.869945633707104, + 9.060459575248002, + 3.1440379154461677, + 1.0998266577550277 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.309646045393761, + "eval_scarebleu_sys_len": 235440, + "eval_scarebleu_totals": [ + 235440, + 218245, + 201079, + 184029 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 179090, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 82.0125567273743, + "step": 49000 + }, + { + "epoch": 19.39, + "learning_rate": 4.551105408606396e-05, + "loss": 2.8033, + "step": 49500 + }, + { + "epoch": 19.39, + "eval_bleu_bleu": 0.04414075522038384, + "eval_bleu_brevity_penalty": 0.890043915510267, + "eval_bleu_length_ratio": 0.8956685230339224, + "eval_bleu_precisions": [ + 0.3057366026455002, + 0.08183504566210045, + 0.027329789135096497, + 0.008846882306852323 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 213419, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 22.262097613574696, + "eval_chrf_word_order": 2, + "eval_loss": 2.778870105743408, + "eval_meteor": 0.19950101380142163, + "eval_runtime": 893.1461, + "eval_samples_per_second": 19.256, + "eval_scarebleu_bp": 0.9420550306850993, + "eval_scarebleu_counts": [ + 78339, + 20255, + 6430, + 2049 + ], + "eval_scarebleu_precisions": [ + 33.11507148110886, + 9.233216787998414, + 3.179941148834104, + 1.1066224521759795 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.395424198475637, + "eval_scarebleu_sys_len": 236566, + "eval_scarebleu_totals": [ + 236566, + 219371, + 202205, + 185158 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 178290, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 81.64620436050905, + "step": 49500 + }, + { + "epoch": 19.58, + "learning_rate": 4.546170548756416e-05, + "loss": 2.8025, + "step": 50000 + }, + { + "epoch": 19.58, + "eval_bleu_bleu": 0.045114153396182716, + "eval_bleu_brevity_penalty": 0.8910352476067671, + "eval_bleu_length_ratio": 0.8965624331141225, + "eval_bleu_precisions": [ + 0.3094620656081486, + 0.08249973273874066, + 0.02783215925126472, + 0.009248362590034443 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 213632, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 22.480765008773503, + "eval_chrf_word_order": 2, + "eval_loss": 2.7635321617126465, + "eval_meteor": 0.20189925998452365, + "eval_runtime": 903.6516, + "eval_samples_per_second": 19.032, + "eval_scarebleu_bp": 0.9385170829380516, + "eval_scarebleu_counts": [ + 79002, + 20395, + 6522, + 2122 + ], + "eval_scarebleu_precisions": [ + 33.51390791968744, + 9.33264389065317, + 3.2388462913670493, + 1.1512212059069258 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.484498264914235, + "eval_scarebleu_sys_len": 235729, + "eval_scarebleu_totals": [ + 235729, + 218534, + 201368, + 184326 + ], + "eval_steps_per_second": 0.595, + "eval_ter_num_edits": 177664, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 81.35953363343698, + "step": 50000 + }, + { + "epoch": 19.78, + "learning_rate": 4.5412455586261355e-05, + "loss": 2.7951, + "step": 50500 + }, + { + "epoch": 19.78, + "eval_bleu_bleu": 0.044936914987908305, + "eval_bleu_brevity_penalty": 0.902352164880661, + "eval_bleu_length_ratio": 0.9068235136121942, + "eval_bleu_precisions": [ + 0.30565492856713117, + 0.08181735903701692, + 0.027392134528506418, + 0.008978546191857995 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 216077, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 22.67359385140361, + "eval_chrf_word_order": 2, + "eval_loss": 2.766113758087158, + "eval_meteor": 0.20240060788488803, + "eval_runtime": 913.7196, + "eval_samples_per_second": 18.822, + "eval_scarebleu_bp": 0.9487770737121132, + "eval_scarebleu_counts": [ + 78887, + 20486, + 6504, + 2082 + ], + "eval_scarebleu_precisions": [ + 33.12297408508423, + 9.270983712647475, + 3.191379741804425, + 1.1149071981664542 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.454843163912916, + "eval_scarebleu_sys_len": 238164, + "eval_scarebleu_totals": [ + 238164, + 220969, + 203799, + 186742 + ], + "eval_steps_per_second": 0.589, + "eval_ter_num_edits": 178210, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 81.60956912382252, + "step": 50500 + }, + { + "epoch": 19.98, + "learning_rate": 4.536310698776155e-05, + "loss": 2.8053, + "step": 51000 + }, + { + "epoch": 19.98, + "eval_bleu_bleu": 0.0468365289023001, + "eval_bleu_brevity_penalty": 0.8948759432157701, + "eval_bleu_length_ratio": 0.9000331544114253, + "eval_bleu_precisions": [ + 0.3134911568178533, + 0.08476964879552275, + 0.02878748341319061, + 0.009808850034944028 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 214459, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 22.710695768405703, + "eval_chrf_word_order": 2, + "eval_loss": 2.7397594451904297, + "eval_meteor": 0.2058374149356775, + "eval_runtime": 895.4427, + "eval_samples_per_second": 19.206, + "eval_scarebleu_bp": 0.9500635949578059, + "eval_scarebleu_counts": [ + 80624, + 21314, + 6863, + 2266 + ], + "eval_scarebleu_precisions": [ + 33.8087230732458, + 9.632314394692601, + 3.3625179443712243, + 1.211512037596437 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.733774611944485, + "eval_scarebleu_sys_len": 238471, + "eval_scarebleu_totals": [ + 238471, + 221276, + 204103, + 187039 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 176758, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 80.94463957796208, + "step": 51000 + }, + { + "epoch": 20.17, + "learning_rate": 4.531375838926175e-05, + "loss": 2.7695, + "step": 51500 + }, + { + "epoch": 20.17, + "eval_bleu_bleu": 0.04581912345353732, + "eval_bleu_brevity_penalty": 0.8886694993783929, + "eval_bleu_length_ratio": 0.89443047855665, + "eval_bleu_precisions": [ + 0.3096929487059177, + 0.08359150508602606, + 0.02854937408405956, + 0.009561718513390733 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 213124, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 22.623952003912088, + "eval_chrf_word_order": 2, + "eval_loss": 2.7505061626434326, + "eval_meteor": 0.20273234089444367, + "eval_runtime": 900.5176, + "eval_samples_per_second": 19.098, + "eval_scarebleu_bp": 0.9441460451329196, + "eval_scarebleu_counts": [ + 79375, + 20772, + 6718, + 2196 + ], + "eval_scarebleu_precisions": [ + 33.48280196741781, + 9.447529642920493, + 3.314273874069433, + 1.1829028522179428 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.602844389281897, + "eval_scarebleu_sys_len": 237062, + "eval_scarebleu_totals": [ + 237062, + 219867, + 202699, + 185645 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 177321, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 81.2024600561435, + "step": 51500 + }, + { + "epoch": 20.37, + "learning_rate": 4.5264409790761944e-05, + "loss": 2.7689, + "step": 52000 + }, + { + "epoch": 20.37, + "eval_bleu_bleu": 0.04712499993621277, + "eval_bleu_brevity_penalty": 0.895575786959035, + "eval_bleu_length_ratio": 0.9006668653133512, + "eval_bleu_precisions": [ + 0.31078234937794136, + 0.08513537471823317, + 0.02925692730147283, + 0.00990377960568625 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 214610, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 22.95212435230834, + "eval_chrf_word_order": 2, + "eval_loss": 2.736898183822632, + "eval_meteor": 0.20530743731503906, + "eval_runtime": 889.7641, + "eval_samples_per_second": 19.329, + "eval_scarebleu_bp": 0.9453877387365368, + "eval_scarebleu_counts": [ + 79858, + 21246, + 6945, + 2282 + ], + "eval_scarebleu_precisions": [ + 33.644678690748535, + 9.650166695433363, + 3.421300241880262, + 1.2272710160749916 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.744545610287841, + "eval_scarebleu_sys_len": 237357, + "eval_scarebleu_totals": [ + 237357, + 220162, + 202993, + 185941 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 177018, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 81.06370409719328, + "step": 52000 + }, + { + "epoch": 20.56, + "learning_rate": 4.521515988945914e-05, + "loss": 2.7515, + "step": 52500 + }, + { + "epoch": 20.56, + "eval_bleu_bleu": 0.047929741619534734, + "eval_bleu_brevity_penalty": 0.9103819669750272, + "eval_bleu_length_ratio": 0.9141678452570307, + "eval_bleu_precisions": [ + 0.3116601706859113, + 0.08521073408030623, + 0.029333057189106112, + 0.009862631917206748 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 217827, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 23.170570445507966, + "eval_chrf_word_order": 2, + "eval_loss": 2.7223594188690186, + "eval_meteor": 0.20898087238007002, + "eval_runtime": 896.4512, + "eval_samples_per_second": 19.185, + "eval_scarebleu_bp": 0.9506330176368408, + "eval_scarebleu_counts": [ + 80577, + 21429, + 7013, + 2299 + ], + "eval_scarebleu_precisions": [ + 33.769755287984005, + 9.678337217494986, + 3.433671820683307, + 1.228150775674174 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.792255063987334, + "eval_scarebleu_sys_len": 238607, + "eval_scarebleu_totals": [ + 238607, + 221412, + 204242, + 187192 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 176503, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 80.82786476102378, + "step": 52500 + }, + { + "epoch": 20.76, + "learning_rate": 4.516581129095934e-05, + "loss": 2.7617, + "step": 53000 + }, + { + "epoch": 20.76, + "eval_bleu_bleu": 0.04818719599754464, + "eval_bleu_brevity_penalty": 0.8977744273183504, + "eval_bleu_length_ratio": 0.9026603267598068, + "eval_bleu_precisions": [ + 0.3164841806727573, + 0.08740714538379908, + 0.029899964589235127, + 0.010034323125969536 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 215085, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 23.171849560924045, + "eval_chrf_word_order": 2, + "eval_loss": 2.714977741241455, + "eval_meteor": 0.20984314267123733, + "eval_runtime": 895.7356, + "eval_samples_per_second": 19.2, + "eval_scarebleu_bp": 0.9444113426970282, + "eval_scarebleu_counts": [ + 81140, + 21813, + 7122, + 2340 + ], + "eval_scarebleu_precisions": [ + 34.218239325250394, + 9.918155776838084, + 3.512527125665812, + 1.2600833593606962 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.879468682325345, + "eval_scarebleu_sys_len": 237125, + "eval_scarebleu_totals": [ + 237125, + 219930, + 202760, + 185702 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 176010, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 80.60210011494306, + "step": 53000 + }, + { + "epoch": 20.96, + "learning_rate": 4.5116462692459535e-05, + "loss": 2.7502, + "step": 53500 + }, + { + "epoch": 20.96, + "eval_bleu_bleu": 0.04844675903421284, + "eval_bleu_brevity_penalty": 0.9040271768582423, + "eval_bleu_length_ratio": 0.9083511345943202, + "eval_bleu_precisions": [ + 0.3120388466140888, + 0.08666171466428435, + 0.0299522214289637, + 0.010182818235785852 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 216441, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 23.216967057942753, + "eval_chrf_word_order": 2, + "eval_loss": 2.717315912246704, + "eval_meteor": 0.20808723960111017, + "eval_runtime": 893.1055, + "eval_samples_per_second": 19.256, + "eval_scarebleu_bp": 0.9540138840147839, + "eval_scarebleu_counts": [ + 80851, + 21792, + 7184, + 2383 + ], + "eval_scarebleu_precisions": [ + 33.770090553680625, + 9.806453935496645, + 3.503552809328502, + 1.2676678210263694 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.90805164681067, + "eval_scarebleu_sys_len": 239416, + "eval_scarebleu_totals": [ + 239416, + 222221, + 205049, + 187983 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 176565, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 80.85625706945582, + "step": 53500 + }, + { + "epoch": 21.15, + "learning_rate": 4.506711409395973e-05, + "loss": 2.725, + "step": 54000 + }, + { + "epoch": 21.15, + "eval_bleu_bleu": 0.049064270561964586, + "eval_bleu_brevity_penalty": 0.900121026384034, + "eval_bleu_length_ratio": 0.9047922813172793, + "eval_bleu_precisions": [ + 0.31409646880928416, + 0.08767729513402353, + 0.03057221520279404, + 0.010485295013091396 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 215593, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 23.38461658995746, + "eval_chrf_word_order": 2, + "eval_loss": 2.713576316833496, + "eval_meteor": 0.20963861598458872, + "eval_runtime": 890.9345, + "eval_samples_per_second": 19.303, + "eval_scarebleu_bp": 0.9454171849655738, + "eval_scarebleu_counts": [ + 80728, + 21856, + 7241, + 2409 + ], + "eval_scarebleu_precisions": [ + 34.01021216359684, + 9.926919775263547, + 3.567030217046473, + 1.2956070906118233 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 5.9418882775455595, + "eval_scarebleu_sys_len": 237364, + "eval_scarebleu_totals": [ + 237364, + 220169, + 202998, + 185936 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 176151, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 80.66666971960305, + "step": 54000 + }, + { + "epoch": 21.35, + "learning_rate": 4.5017864192656935e-05, + "loss": 2.7261, + "step": 54500 + }, + { + "epoch": 21.35, + "eval_bleu_bleu": 0.05012352640102788, + "eval_bleu_brevity_penalty": 0.8990684401420683, + "eval_bleu_length_ratio": 0.9038354198229807, + "eval_bleu_precisions": [ + 0.3180228913704641, + 0.08969066962708785, + 0.03140019224607497, + 0.010785927687336138 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 215365, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 23.6055102953814, + "eval_chrf_word_order": 2, + "eval_loss": 2.6950557231903076, + "eval_meteor": 0.21192921952833738, + "eval_runtime": 897.8236, + "eval_samples_per_second": 19.155, + "eval_scarebleu_bp": 0.9478038063467256, + "eval_scarebleu_counts": [ + 81601, + 22343, + 7439, + 2507 + ], + "eval_scarebleu_precisions": [ + 34.295933291864905, + 10.122000389603917, + 3.6543430631834393, + 1.3442143021828068 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.090671117989266, + "eval_scarebleu_sys_len": 237932, + "eval_scarebleu_totals": [ + 237932, + 220737, + 203566, + 186503 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 175371, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 80.30947616190943, + "step": 54500 + }, + { + "epoch": 21.54, + "learning_rate": 4.496851559415713e-05, + "loss": 2.7317, + "step": 55000 + }, + { + "epoch": 21.54, + "eval_bleu_bleu": 0.050208139568594996, + "eval_bleu_brevity_penalty": 0.8970343163361828, + "eval_bleu_length_ratio": 0.9019888450094218, + "eval_bleu_precisions": [ + 0.31850645574037456, + 0.09028473170485005, + 0.03152135388977494, + 0.010827367378505445 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 214925, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 23.742292988035626, + "eval_chrf_word_order": 2, + "eval_loss": 2.6874306201934814, + "eval_meteor": 0.2126455810923772, + "eval_runtime": 909.4588, + "eval_samples_per_second": 18.91, + "eval_scarebleu_bp": 0.9441081400559477, + "eval_scarebleu_counts": [ + 81550, + 22508, + 7515, + 2539 + ], + "eval_scarebleu_precisions": [ + 34.4015895179559, + 10.23751694275396, + 3.707687222170144, + 1.367818816532345 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.137590994073925, + "eval_scarebleu_sys_len": 237053, + "eval_scarebleu_totals": [ + 237053, + 219858, + 202687, + 185624 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 175083, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 80.17758930983794, + "step": 55000 + }, + { + "epoch": 21.74, + "learning_rate": 4.491916699565733e-05, + "loss": 2.7133, + "step": 55500 + }, + { + "epoch": 21.74, + "eval_bleu_bleu": 0.050590730435689756, + "eval_bleu_brevity_penalty": 0.898356919105033, + "eval_bleu_length_ratio": 0.903189118638235, + "eval_bleu_precisions": [ + 0.3182690475858576, + 0.09017453135100194, + 0.031830898696243545, + 0.011009331079390458 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 215211, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 23.757913659660424, + "eval_chrf_word_order": 2, + "eval_loss": 2.6841437816619873, + "eval_meteor": 0.21309769118752173, + "eval_runtime": 917.619, + "eval_samples_per_second": 18.742, + "eval_scarebleu_bp": 0.9455181372427318, + "eval_scarebleu_counts": [ + 81694, + 22533, + 7535, + 2552 + ], + "eval_scarebleu_precisions": [ + 34.41370246179251, + 10.233295336364009, + 3.711383875797935, + 1.3722495859591766 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.153168912838404, + "eval_scarebleu_sys_len": 237388, + "eval_scarebleu_totals": [ + 237388, + 220193, + 203024, + 185972 + ], + "eval_steps_per_second": 0.586, + "eval_ter_num_edits": 175298, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 80.27604650843297, + "step": 55500 + }, + { + "epoch": 21.93, + "learning_rate": 4.486981839715752e-05, + "loss": 2.7183, + "step": 56000 + }, + { + "epoch": 21.93, + "eval_bleu_bleu": 0.05118363867584171, + "eval_bleu_brevity_penalty": 0.8960806999856069, + "eval_bleu_length_ratio": 0.9011243122558009, + "eval_bleu_precisions": [ + 0.32101025060660676, + 0.09148761669468014, + 0.03230581582303044, + 0.011219518166682988 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 214719, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 23.702669722243535, + "eval_chrf_word_order": 2, + "eval_loss": 2.675546407699585, + "eval_meteor": 0.21461276951508415, + "eval_runtime": 922.3194, + "eval_samples_per_second": 18.646, + "eval_scarebleu_bp": 0.9475729431283353, + "eval_scarebleu_counts": [ + 82266, + 22726, + 7636, + 2584 + ], + "eval_scarebleu_precisions": [ + 34.58341916200389, + 10.29807596451002, + 3.7521682087770074, + 1.385857177335014 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.216112274830739, + "eval_scarebleu_sys_len": 237877, + "eval_scarebleu_totals": [ + 237877, + 220682, + 203509, + 186455 + ], + "eval_steps_per_second": 0.583, + "eval_ter_num_edits": 174688, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.9967028286982, + "step": 56000 + }, + { + "epoch": 22.13, + "learning_rate": 4.482056849585472e-05, + "loss": 2.6921, + "step": 56500 + }, + { + "epoch": 22.13, + "eval_bleu_bleu": 0.05116228762014231, + "eval_bleu_brevity_penalty": 0.8981211852958223, + "eval_bleu_length_ratio": 0.9029750838302998, + "eval_bleu_precisions": [ + 0.32089142963376094, + 0.09192534033793852, + 0.03218313247681255, + 0.011092728371621664 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 215160, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.012563922072662, + "eval_chrf_word_order": 2, + "eval_loss": 2.676431894302368, + "eval_meteor": 0.2154382480843029, + "eval_runtime": 894.1319, + "eval_samples_per_second": 19.234, + "eval_scarebleu_bp": 0.944802850998912, + "eval_scarebleu_counts": [ + 82203, + 22880, + 7687, + 2607 + ], + "eval_scarebleu_precisions": [ + 34.652935274726204, + 10.398912840930267, + 3.789480949070993, + 1.4031896055244872 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.250967029592484, + "eval_scarebleu_sys_len": 237218, + "eval_scarebleu_totals": [ + 237218, + 220023, + 202851, + 185791 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 174668, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.98754401952658, + "step": 56500 + }, + { + "epoch": 22.33, + "learning_rate": 4.477121989735492e-05, + "loss": 2.6939, + "step": 57000 + }, + { + "epoch": 22.33, + "eval_bleu_bleu": 0.052296116592015385, + "eval_bleu_brevity_penalty": 0.9029000435725355, + "eval_bleu_length_ratio": 0.907322928164043, + "eval_bleu_precisions": [ + 0.3216016947584599, + 0.09269253575340951, + 0.032757226991031216, + 0.011525209880137817 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 216196, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.051135582593403, + "eval_chrf_word_order": 2, + "eval_loss": 2.661938428878784, + "eval_meteor": 0.21644303523708788, + "eval_runtime": 898.1637, + "eval_samples_per_second": 19.148, + "eval_scarebleu_bp": 0.9511686634668655, + "eval_scarebleu_counts": [ + 82850, + 23184, + 7831, + 2697 + ], + "eval_scarebleu_precisions": [ + 34.70375102100655, + 10.464880089915637, + 3.8317007055692014, + 1.43978987716142 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.363673311455668, + "eval_scarebleu_sys_len": 238735, + "eval_scarebleu_totals": [ + 238735, + 221541, + 204374, + 187319 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 174422, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.87489066671552, + "step": 57000 + }, + { + "epoch": 22.52, + "learning_rate": 4.4721871298855115e-05, + "loss": 2.6772, + "step": 57500 + }, + { + "epoch": 22.52, + "eval_bleu_bleu": 0.05201669258334987, + "eval_bleu_brevity_penalty": 0.9038616291527445, + "eval_bleu_length_ratio": 0.9082000512004834, + "eval_bleu_precisions": [ + 0.32220604884360343, + 0.09313742715010717, + 0.03275347830624475, + 0.011159578335150855 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 216405, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.21825345322858, + "eval_chrf_word_order": 2, + "eval_loss": 2.6572721004486084, + "eval_meteor": 0.2180234913423442, + "eval_runtime": 899.1116, + "eval_samples_per_second": 19.128, + "eval_scarebleu_bp": 0.9450595681563844, + "eval_scarebleu_counts": [ + 82547, + 23220, + 7806, + 2610 + ], + "eval_scarebleu_precisions": [ + 34.789003662355285, + 10.55046913692437, + 3.846968898000621, + 1.4042752379466374 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.3063831370574714, + "eval_scarebleu_sys_len": 237279, + "eval_scarebleu_totals": [ + 237279, + 220085, + 202913, + 185861 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 174253, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.79749872921523, + "step": 57500 + }, + { + "epoch": 22.72, + "learning_rate": 4.467252270035531e-05, + "loss": 2.6827, + "step": 58000 + }, + { + "epoch": 22.72, + "eval_bleu_bleu": 0.052868160524278014, + "eval_bleu_brevity_penalty": 0.9042202845605629, + "eval_bleu_length_ratio": 0.9085273985537962, + "eval_bleu_precisions": [ + 0.32389148339592483, + 0.09382401348801735, + 0.033157270551028926, + 0.01159811765275902 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 216483, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.33449758321573, + "eval_chrf_word_order": 2, + "eval_loss": 2.641231060028076, + "eval_meteor": 0.21982226071266364, + "eval_runtime": 899.4594, + "eval_samples_per_second": 19.12, + "eval_scarebleu_bp": 0.9568222752567327, + "eval_scarebleu_counts": [ + 83661, + 23667, + 8005, + 2734 + ], + "eval_scarebleu_precisions": [ + 34.84568286892415, + 10.618003992911461, + 3.8911735254372406, + 1.4492446329181023 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.466731333488236, + "eval_scarebleu_sys_len": 240090, + "eval_scarebleu_totals": [ + 240090, + 222895, + 205722, + 188650 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 173789, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.58501435643338, + "step": 58000 + }, + { + "epoch": 22.91, + "learning_rate": 4.462327279905251e-05, + "loss": 2.684, + "step": 58500 + }, + { + "epoch": 22.91, + "eval_bleu_bleu": 0.05307953154544375, + "eval_bleu_brevity_penalty": 0.9075346341836749, + "eval_bleu_length_ratio": 0.9115574599524088, + "eval_bleu_precisions": [ + 0.3230588614442577, + 0.09392030398480077, + 0.03326096348512772, + 0.011595234075396156 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 217205, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.271267623569596, + "eval_chrf_word_order": 2, + "eval_loss": 2.6418449878692627, + "eval_meteor": 0.2195449744361645, + "eval_runtime": 893.9659, + "eval_samples_per_second": 19.238, + "eval_scarebleu_bp": 0.9477114671198703, + "eval_scarebleu_counts": [ + 83031, + 23510, + 7994, + 2706 + ], + "eval_scarebleu_precisions": [ + 34.90017233407591, + 10.651745463606915, + 3.9273870642855386, + 1.451101732634774 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.429668983729075, + "eval_scarebleu_sys_len": 237910, + "eval_scarebleu_totals": [ + 237910, + 220715, + 203545, + 186479 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 173973, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.6692754008124, + "step": 58500 + }, + { + "epoch": 23.11, + "learning_rate": 4.4573924200552705e-05, + "loss": 2.6624, + "step": 59000 + }, + { + "epoch": 23.11, + "eval_bleu_bleu": 0.05382168481409135, + "eval_bleu_brevity_penalty": 0.901956050374312, + "eval_bleu_length_ratio": 0.9064625921713622, + "eval_bleu_precisions": [ + 0.3248422387969869, + 0.09523785570204782, + 0.034094725309814417, + 0.01202038423926578 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 215991, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.5000431213031, + "eval_chrf_word_order": 2, + "eval_loss": 2.63627552986145, + "eval_meteor": 0.22025836721540867, + "eval_runtime": 892.0038, + "eval_samples_per_second": 19.28, + "eval_scarebleu_bp": 0.9479632823440178, + "eval_scarebleu_counts": [ + 83349, + 23744, + 8150, + 2814 + ], + "eval_scarebleu_precisions": [ + 35.02500315165777, + 10.75479218755662, + 4.002828993251672, + 1.5084508627759998 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.5465293412127785, + "eval_scarebleu_sys_len": 237970, + "eval_scarebleu_totals": [ + 237970, + 220776, + 203606, + 186549 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 173725, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.55570616708415, + "step": 59000 + }, + { + "epoch": 23.31, + "learning_rate": 4.45245756020529e-05, + "loss": 2.6407, + "step": 59500 + }, + { + "epoch": 23.31, + "eval_bleu_bleu": 0.054428765578446815, + "eval_bleu_brevity_penalty": 0.9088173032067204, + "eval_bleu_length_ratio": 0.9127325530155825, + "eval_bleu_precisions": [ + 0.3253879577901924, + 0.09557142143891358, + 0.03424231172461995, + 0.01208133683272736 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 217485, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.501534402928776, + "eval_chrf_word_order": 2, + "eval_loss": 2.6298329830169678, + "eval_meteor": 0.22141380035693745, + "eval_runtime": 902.8679, + "eval_samples_per_second": 19.048, + "eval_scarebleu_bp": 0.9476568992331149, + "eval_scarebleu_counts": [ + 83556, + 23895, + 8213, + 2842 + ], + "eval_scarebleu_precisions": [ + 35.12276321265085, + 10.826816249966017, + 4.03523770217951, + 1.524097580857077 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.590129720027328, + "eval_scarebleu_sys_len": 237897, + "eval_scarebleu_totals": [ + 237897, + 220702, + 203532, + 186471 + ], + "eval_steps_per_second": 0.596, + "eval_ter_num_edits": 173350, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.38397849511607, + "step": 59500 + }, + { + "epoch": 23.5, + "learning_rate": 4.44752270035531e-05, + "loss": 2.6425, + "step": 60000 + }, + { + "epoch": 23.5, + "eval_bleu_bleu": 0.054978259778547145, + "eval_bleu_brevity_penalty": 0.9156770106707476, + "eval_bleu_length_ratio": 0.9190402847082622, + "eval_bleu_precisions": [ + 0.32525526512868286, + 0.09524116297393864, + 0.03426760906653668, + 0.012242268041237113 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 218988, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.656456217034272, + "eval_chrf_word_order": 2, + "eval_loss": 2.6207640171051025, + "eval_meteor": 0.2220244477201187, + "eval_runtime": 892.9344, + "eval_samples_per_second": 19.26, + "eval_scarebleu_bp": 0.956705756139604, + "eval_scarebleu_counts": [ + 84204, + 24005, + 8262, + 2875 + ], + "eval_scarebleu_precisions": [ + 35.07593871583175, + 10.770997949449672, + 4.016646085933474, + 1.5241720432387729 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.634666356709226, + "eval_scarebleu_sys_len": 240062, + "eval_scarebleu_totals": [ + 240062, + 222867, + 205694, + 188627 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 173219, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.32398829504189, + "step": 60000 + }, + { + "epoch": 23.7, + "learning_rate": 4.44259771022503e-05, + "loss": 2.6505, + "step": 60500 + }, + { + "epoch": 23.7, + "eval_bleu_bleu": 0.05561466598702213, + "eval_bleu_brevity_penalty": 0.9168274909956059, + "eval_bleu_length_ratio": 0.9201020652260585, + "eval_bleu_precisions": [ + 0.3294821680251413, + 0.09704225770369124, + 0.034728194144721544, + 0.012193596425912136 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219241, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.89275403380587, + "eval_chrf_word_order": 2, + "eval_loss": 2.6011619567871094, + "eval_meteor": 0.22617831696136273, + "eval_runtime": 898.9746, + "eval_samples_per_second": 19.131, + "eval_scarebleu_bp": 0.9531957854224125, + "eval_scarebleu_counts": [ + 85031, + 24392, + 8370, + 2888 + ], + "eval_scarebleu_precisions": [ + 35.54510492433743, + 10.986150208309875, + 4.0858766328861815, + 1.537945394418025 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.7088022096001785, + "eval_scarebleu_sys_len": 239220, + "eval_scarebleu_totals": [ + 239220, + 222025, + 204852, + 187783 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 172286, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.89672984718527, + "step": 60500 + }, + { + "epoch": 23.89, + "learning_rate": 4.437662850375049e-05, + "loss": 2.6491, + "step": 61000 + }, + { + "epoch": 23.89, + "eval_bleu_bleu": 0.05478926295904038, + "eval_bleu_brevity_penalty": 0.9084647180760549, + "eval_bleu_length_ratio": 0.9124094024232098, + "eval_bleu_precisions": [ + 0.3263219384751251, + 0.0968069006508069, + 0.03452985103163461, + 0.012128365561222954 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 217408, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.7250111889774, + "eval_chrf_word_order": 2, + "eval_loss": 2.612759828567505, + "eval_meteor": 0.2221017980499946, + "eval_runtime": 894.999, + "eval_samples_per_second": 19.216, + "eval_scarebleu_bp": 0.9587263522772674, + "eval_scarebleu_counts": [ + 84537, + 24414, + 8388, + 2905 + ], + "eval_scarebleu_precisions": [ + 35.143505662071604, + 10.930679238693907, + 4.068250380731587, + 1.536021150033047 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.710717242605423, + "eval_scarebleu_sys_len": 240548, + "eval_scarebleu_totals": [ + 240548, + 223353, + 206182, + 189125 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 173076, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.25850280946472, + "step": 61000 + }, + { + "epoch": 24.09, + "learning_rate": 4.432727990525069e-05, + "loss": 2.6231, + "step": 61500 + }, + { + "epoch": 24.09, + "eval_bleu_bleu": 0.05610299393185716, + "eval_bleu_brevity_penalty": 0.9094672291289463, + "eval_bleu_length_ratio": 0.9133284930690493, + "eval_bleu_precisions": [ + 0.32880570885046434, + 0.09806318352358905, + 0.03538905590990686, + 0.01269058430818272 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 217627, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 24.990281809660868, + "eval_chrf_word_order": 2, + "eval_loss": 2.6066319942474365, + "eval_meteor": 0.22500605839137205, + "eval_runtime": 911.5451, + "eval_samples_per_second": 18.867, + "eval_scarebleu_bp": 0.9486554644055396, + "eval_scarebleu_counts": [ + 84527, + 24591, + 8548, + 3016 + ], + "eval_scarebleu_precisions": [ + 35.495412266151554, + 11.130171087172988, + 4.1949050649994355, + 1.6153912074727912 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.823811033343128, + "eval_scarebleu_sys_len": 238135, + "eval_scarebleu_totals": [ + 238135, + 220940, + 203771, + 186704 + ], + "eval_steps_per_second": 0.59, + "eval_ter_num_edits": 172545, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 79.0153364259579, + "step": 61500 + }, + { + "epoch": 24.29, + "learning_rate": 4.427793130675089e-05, + "loss": 2.6176, + "step": 62000 + }, + { + "epoch": 24.29, + "eval_bleu_bleu": 0.056983168433011266, + "eval_bleu_brevity_penalty": 0.9169183863639909, + "eval_bleu_length_ratio": 0.9201860004448567, + "eval_bleu_precisions": [ + 0.330405316038876, + 0.09885383983450952, + 0.03571447885739626, + 0.012787297276371195 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219261, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 25.202633791241606, + "eval_chrf_word_order": 2, + "eval_loss": 2.588744878768921, + "eval_meteor": 0.228321315655883, + "eval_runtime": 911.0526, + "eval_samples_per_second": 18.877, + "eval_scarebleu_bp": 0.9573963583182418, + "eval_scarebleu_counts": [ + 85508, + 24972, + 8695, + 3039 + ], + "eval_scarebleu_precisions": [ + 35.59451854071965, + 11.196549389552219, + 4.223703257522029, + 1.6096398305084745 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.9073924120145955, + "eval_scarebleu_sys_len": 240228, + "eval_scarebleu_totals": [ + 240228, + 223033, + 205862, + 188800 + ], + "eval_steps_per_second": 0.591, + "eval_ter_num_edits": 171911, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.72500217521717, + "step": 62000 + }, + { + "epoch": 24.48, + "learning_rate": 4.422868140544809e-05, + "loss": 2.6146, + "step": 62500 + }, + { + "epoch": 24.48, + "eval_bleu_bleu": 0.05780323062255137, + "eval_bleu_brevity_penalty": 0.9169592868094966, + "eval_bleu_length_ratio": 0.9202237712933158, + "eval_bleu_precisions": [ + 0.33067451087700095, + 0.09998267969813188, + 0.036368454354209816, + 0.013132817153067302 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219270, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 25.211527211533475, + "eval_chrf_word_order": 2, + "eval_loss": 2.586228609085083, + "eval_meteor": 0.2284859942830685, + "eval_runtime": 905.2887, + "eval_samples_per_second": 18.997, + "eval_scarebleu_bp": 0.9556856596327425, + "eval_scarebleu_counts": [ + 85432, + 25140, + 8798, + 3108 + ], + "eval_scarebleu_precisions": [ + 35.62382983691732, + 11.29268446065528, + 4.282348818192438, + 1.649804125571964 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.977954380262084, + "eval_scarebleu_sys_len": 239817, + "eval_scarebleu_totals": [ + 239817, + 222622, + 205448, + 188386 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 172014, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.77217004245108, + "step": 62500 + }, + { + "epoch": 24.68, + "learning_rate": 4.4179332806948285e-05, + "loss": 2.6063, + "step": 63000 + }, + { + "epoch": 24.68, + "eval_bleu_bleu": 0.05742490650909593, + "eval_bleu_brevity_penalty": 0.9142155647669955, + "eval_bleu_length_ratio": 0.9176931244465522, + "eval_bleu_precisions": [ + 0.3324552858913325, + 0.10061944091486658, + 0.036296557523804354, + 0.012821125868190458 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 218667, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 25.342155700236233, + "eval_chrf_word_order": 2, + "eval_loss": 2.5770907402038574, + "eval_meteor": 0.22953669307513327, + "eval_runtime": 913.6091, + "eval_samples_per_second": 18.824, + "eval_scarebleu_bp": 0.961783055700235, + "eval_scarebleu_counts": [ + 86189, + 25380, + 8820, + 3069 + ], + "eval_scarebleu_precisions": [ + 35.72082806639451, + 11.325806595564282, + 4.262537514679657, + 1.6165564030171506 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.988589887587128, + "eval_scarebleu_sys_len": 241285, + "eval_scarebleu_totals": [ + 241285, + 224090, + 206919, + 189848 + ], + "eval_steps_per_second": 0.589, + "eval_ter_num_edits": 171379, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.48137785125178, + "step": 63000 + }, + { + "epoch": 24.87, + "learning_rate": 4.412998420844848e-05, + "loss": 2.6212, + "step": 63500 + }, + { + "epoch": 24.87, + "eval_bleu_bleu": 0.057523331929043374, + "eval_bleu_brevity_penalty": 0.9152128376971128, + "eval_bleu_length_ratio": 0.9186122150923917, + "eval_bleu_precisions": [ + 0.3307703553447914, + 0.09978134869676882, + 0.03630185979971388, + 0.013025154905027399 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 218886, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 25.298545928563804, + "eval_chrf_word_order": 2, + "eval_loss": 2.5869178771972656, + "eval_meteor": 0.22823772849104643, + "eval_runtime": 913.3315, + "eval_samples_per_second": 18.83, + "eval_scarebleu_bp": 0.9542308234814221, + "eval_scarebleu_counts": [ + 85460, + 25088, + 8774, + 3102 + ], + "eval_scarebleu_precisions": [ + 35.68744049309302, + 11.287020915720758, + 4.277829783914502, + 1.6497016497016497 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 6.967618297013175, + "eval_scarebleu_sys_len": 239468, + "eval_scarebleu_totals": [ + 239468, + 222273, + 205104, + 188034 + ], + "eval_steps_per_second": 0.589, + "eval_ter_num_edits": 172013, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.77171210199249, + "step": 63500 + }, + { + "epoch": 25.07, + "learning_rate": 4.408063560994868e-05, + "loss": 2.5937, + "step": 64000 + }, + { + "epoch": 25.07, + "eval_bleu_bleu": 0.058653795077991004, + "eval_bleu_brevity_penalty": 0.9186076605979033, + "eval_bleu_length_ratio": 0.9217471955145019, + "eval_bleu_precisions": [ + 0.333451712629705, + 0.10113713828431421, + 0.03687812354953963, + 0.013364471541816712 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219633, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 25.504073578705277, + "eval_chrf_word_order": 2, + "eval_loss": 2.5640196800231934, + "eval_meteor": 0.2317973104053829, + "eval_runtime": 905.7823, + "eval_samples_per_second": 18.987, + "eval_scarebleu_bp": 0.9588135738902916, + "eval_scarebleu_counts": [ + 86402, + 25568, + 9002, + 3202 + ], + "eval_scarebleu_precisions": [ + 35.91568323433194, + 11.44627396205467, + 4.365558546107029, + 1.6928811229480027 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.118488876120189, + "eval_scarebleu_sys_len": 240569, + "eval_scarebleu_totals": [ + 240569, + 223374, + 206205, + 189145 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 171132, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.36826655798214, + "step": 64000 + }, + { + "epoch": 25.26, + "learning_rate": 4.4031385708645876e-05, + "loss": 2.5737, + "step": 64500 + }, + { + "epoch": 25.26, + "eval_bleu_bleu": 0.05859400213384084, + "eval_bleu_brevity_penalty": 0.9075392178018971, + "eval_bleu_length_ratio": 0.9115616567133487, + "eval_bleu_precisions": [ + 0.33727889653140336, + 0.10300433476158811, + 0.03740060593465968, + 0.013372965868187656 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 217206, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 25.60674453343085, + "eval_chrf_word_order": 2, + "eval_loss": 2.5590660572052, + "eval_meteor": 0.23255398473135155, + "eval_runtime": 897.437, + "eval_samples_per_second": 19.163, + "eval_scarebleu_bp": 0.9460900181934362, + "eval_scarebleu_counts": [ + 86324, + 25651, + 8996, + 3163 + ], + "eval_scarebleu_precisions": [ + 36.343274784863844, + 11.642135170585806, + 4.428058811079007, + 1.6996055926319975 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.107011483238888, + "eval_scarebleu_sys_len": 237524, + "eval_scarebleu_totals": [ + 237524, + 220329, + 203159, + 186102 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 170687, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.16448305391333, + "step": 64500 + }, + { + "epoch": 25.46, + "learning_rate": 4.398203711014607e-05, + "loss": 2.5721, + "step": 65000 + }, + { + "epoch": 25.46, + "eval_bleu_bleu": 0.05917854032401079, + "eval_bleu_brevity_penalty": 0.9211502484163879, + "eval_bleu_length_ratio": 0.9241015784017895, + "eval_bleu_precisions": [ + 0.33420529169732144, + 0.10212858191419662, + 0.037235530875357824, + 0.013403460142030478 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 220194, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 25.72539106295216, + "eval_chrf_word_order": 2, + "eval_loss": 2.556518793106079, + "eval_meteor": 0.23294216865027137, + "eval_runtime": 902.7761, + "eval_samples_per_second": 19.05, + "eval_scarebleu_bp": 0.9568056304638041, + "eval_scarebleu_counts": [ + 86513, + 25770, + 9075, + 3213 + ], + "eval_scarebleu_precisions": [ + 36.03417108869322, + 11.56170504865607, + 4.411314352934314, + 1.7030276046304542 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.156575403545769, + "eval_scarebleu_sys_len": 240086, + "eval_scarebleu_totals": [ + 240086, + 222891, + 205721, + 188664 + ], + "eval_steps_per_second": 0.596, + "eval_ter_num_edits": 171056, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.33346308312993, + "step": 65000 + }, + { + "epoch": 25.66, + "learning_rate": 4.393268851164627e-05, + "loss": 2.5787, + "step": 65500 + }, + { + "epoch": 25.66, + "eval_bleu_bleu": 0.05994987284667308, + "eval_bleu_brevity_penalty": 0.9177542685573163, + "eval_bleu_length_ratio": 0.9209582044577995, + "eval_bleu_precisions": [ + 0.3365171227414614, + 0.10316934487021014, + 0.03767173242427026, + 0.013921113689095127 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219445, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 25.771083799189686, + "eval_chrf_word_order": 2, + "eval_loss": 2.5450828075408936, + "eval_meteor": 0.23416274073458743, + "eval_runtime": 912.9304, + "eval_samples_per_second": 18.838, + "eval_scarebleu_bp": 0.9566849477875489, + "eval_scarebleu_counts": [ + 86917, + 25953, + 9156, + 3270 + ], + "eval_scarebleu_precisions": [ + 36.206817547499135, + 11.645323114752626, + 4.451315559185579, + 1.733515697064156 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.225342781277758, + "eval_scarebleu_sys_len": 240057, + "eval_scarebleu_totals": [ + 240057, + 222862, + 205692, + 188634 + ], + "eval_steps_per_second": 0.589, + "eval_ter_num_edits": 170624, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.1356328050227, + "step": 65500 + }, + { + "epoch": 25.85, + "learning_rate": 4.388333991314647e-05, + "loss": 2.5906, + "step": 66000 + }, + { + "epoch": 25.85, + "eval_bleu_bleu": 0.0598648986373195, + "eval_bleu_brevity_penalty": 0.9144068930656034, + "eval_bleu_length_ratio": 0.9178693884060283, + "eval_bleu_precisions": [ + 0.3358618072415859, + 0.10360074238018202, + 0.038018008244738555, + 0.013887311992446832 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 218709, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 25.874377756737733, + "eval_chrf_word_order": 2, + "eval_loss": 2.550560474395752, + "eval_meteor": 0.2339755117263243, + "eval_runtime": 899.1529, + "eval_samples_per_second": 19.127, + "eval_scarebleu_bp": 0.9591914499422919, + "eval_scarebleu_counts": [ + 86849, + 26106, + 9230, + 3297 + ], + "eval_scarebleu_precisions": [ + 36.08784176847004, + 11.682366366097598, + 4.474218708342018, + 1.7423701942132381 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.262608648472597, + "eval_scarebleu_sys_len": 240660, + "eval_scarebleu_totals": [ + 240660, + 223465, + 206293, + 189225 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 170747, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.19195948142821, + "step": 66000 + }, + { + "epoch": 26.05, + "learning_rate": 4.383409001184366e-05, + "loss": 2.5714, + "step": 66500 + }, + { + "epoch": 26.05, + "eval_bleu_bleu": 0.06080485014488548, + "eval_bleu_brevity_penalty": 0.9158817301970796, + "eval_bleu_length_ratio": 0.9192291389505579, + "eval_bleu_precisions": [ + 0.338506069861619, + 0.10500004954468435, + 0.03868707597177928, + 0.014127764127764128 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219033, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.026105955780853, + "eval_chrf_word_order": 2, + "eval_loss": 2.5397377014160156, + "eval_meteor": 0.23587960338950711, + "eval_runtime": 908.3887, + "eval_samples_per_second": 18.932, + "eval_scarebleu_bp": 0.9520635872211706, + "eval_scarebleu_counts": [ + 87080, + 26253, + 9355, + 3350 + ], + "eval_scarebleu_precisions": [ + 36.442922966825556, + 11.838794339673692, + 4.572693856802096, + 1.7863998976152895 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.335569363243176, + "eval_scarebleu_sys_len": 238949, + "eval_scarebleu_totals": [ + 238949, + 221754, + 204584, + 187528 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 170180, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.93230724141247, + "step": 66500 + }, + { + "epoch": 26.24, + "learning_rate": 4.378474141334386e-05, + "loss": 2.5528, + "step": 67000 + }, + { + "epoch": 26.24, + "eval_bleu_bleu": 0.06082477859035546, + "eval_bleu_brevity_penalty": 0.9186348855087425, + "eval_bleu_length_ratio": 0.9217723760801414, + "eval_bleu_precisions": [ + 0.3364611931396519, + 0.10445851692319852, + 0.03855058854006444, + 0.014185366549396216 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219639, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.062898625449144, + "eval_chrf_word_order": 2, + "eval_loss": 2.538325786590576, + "eval_meteor": 0.23532349085355833, + "eval_runtime": 898.8563, + "eval_samples_per_second": 19.133, + "eval_scarebleu_bp": 0.9535423030384268, + "eval_scarebleu_counts": [ + 86772, + 26177, + 9294, + 3339 + ], + "eval_scarebleu_precisions": [ + 36.260305971926805, + 11.785707853836872, + 4.535074364679705, + 1.7773117295122107 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.305059436660398, + "eval_scarebleu_sys_len": 239303, + "eval_scarebleu_totals": [ + 239303, + 222108, + 204936, + 187868 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 170398, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 78.03213826138325, + "step": 67000 + }, + { + "epoch": 26.44, + "learning_rate": 4.373539281484406e-05, + "loss": 2.5374, + "step": 67500 + }, + { + "epoch": 26.44, + "eval_bleu_bleu": 0.06161698986746237, + "eval_bleu_brevity_penalty": 0.9120311433923404, + "eval_bleu_length_ratio": 0.9156828759563369, + "eval_bleu_precisions": [ + 0.3418382312501146, + 0.1066604309602822, + 0.039409268929503916, + 0.014499094930411537 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 218188, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.114334309166367, + "eval_chrf_word_order": 2, + "eval_loss": 2.5221827030181885, + "eval_meteor": 0.23777268570310298, + "eval_runtime": 908.4242, + "eval_samples_per_second": 18.932, + "eval_scarebleu_bp": 0.9519005504215242, + "eval_scarebleu_counts": [ + 87745, + 26614, + 9462, + 3407 + ], + "eval_scarebleu_precisions": [ + 36.72721945502491, + 12.003698441693164, + 4.625831715938146, + 1.8171151230699485 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.426948759995625, + "eval_scarebleu_sys_len": 238910, + "eval_scarebleu_totals": [ + 238910, + 221715, + 204547, + 187495 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 169561, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.64884209755047, + "step": 67500 + }, + { + "epoch": 26.64, + "learning_rate": 4.368604421634426e-05, + "loss": 2.5449, + "step": 68000 + }, + { + "epoch": 26.64, + "eval_bleu_bleu": 0.061473271624170364, + "eval_bleu_brevity_penalty": 0.9140424293830017, + "eval_bleu_length_ratio": 0.9175336475308357, + "eval_bleu_precisions": [ + 0.33977194242300884, + 0.10626805802396815, + 0.039114815658950065, + 0.014485995276955729 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 218629, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.143871121537877, + "eval_chrf_word_order": 2, + "eval_loss": 2.528550624847412, + "eval_meteor": 0.23688729672482184, + "eval_runtime": 908.2397, + "eval_samples_per_second": 18.936, + "eval_scarebleu_bp": 0.9481227342382456, + "eval_scarebleu_counts": [ + 87071, + 26471, + 9433, + 3416 + ], + "eval_scarebleu_precisions": [ + 36.58322409330779, + 11.98797172267937, + 4.6321485744591, + 1.8308794760340235 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.404266492162657, + "eval_scarebleu_sys_len": 238008, + "eval_scarebleu_totals": [ + 238008, + 220813, + 203642, + 186577 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 169926, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.81599036493276, + "step": 68000 + }, + { + "epoch": 26.83, + "learning_rate": 4.3636794315041456e-05, + "loss": 2.5519, + "step": 68500 + }, + { + "epoch": 26.83, + "eval_bleu_bleu": 0.06253638797872006, + "eval_bleu_brevity_penalty": 0.923397811130453, + "eval_bleu_length_ratio": 0.926187368588923, + "eval_bleu_precisions": [ + 0.3396876175285807, + 0.10662617447025986, + 0.039497480425671215, + 0.01470492703639617 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 220691, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.388923092749156, + "eval_chrf_word_order": 2, + "eval_loss": 2.5187106132507324, + "eval_meteor": 0.23907445705399216, + "eval_runtime": 914.4013, + "eval_samples_per_second": 18.808, + "eval_scarebleu_bp": 0.9610746332762926, + "eval_scarebleu_counts": [ + 88059, + 26949, + 9677, + 3522 + ], + "eval_scarebleu_precisions": [ + 36.52172831108936, + 12.035155569647953, + 4.680577321183276, + 1.8567233735219226 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.5556099384102415, + "eval_scarebleu_sys_len": 241114, + "eval_scarebleu_totals": [ + 241114, + 223919, + 206748, + 189689 + ], + "eval_steps_per_second": 0.588, + "eval_ter_num_edits": 169575, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.65525326397061, + "step": 68500 + }, + { + "epoch": 27.03, + "learning_rate": 4.358744571654165e-05, + "loss": 2.5409, + "step": 69000 + }, + { + "epoch": 27.03, + "eval_bleu_bleu": 0.06238950529415009, + "eval_bleu_brevity_penalty": 0.9188753426641745, + "eval_bleu_length_ratio": 0.9219948044099564, + "eval_bleu_precisions": [ + 0.3415281393951532, + 0.10737443023847267, + 0.03967303334412431, + 0.014608210063565615 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219692, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.384141372667774, + "eval_chrf_word_order": 2, + "eval_loss": 2.515241861343384, + "eval_meteor": 0.23948042845594966, + "eval_runtime": 923.1935, + "eval_samples_per_second": 18.629, + "eval_scarebleu_bp": 0.9548104989807567, + "eval_scarebleu_counts": [ + 88070, + 26940, + 9605, + 3476 + ], + "eval_scarebleu_precisions": [ + 36.756021318241956, + 12.11265579195367, + 4.679886961605924, + 1.8471970538376103 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.520492822325689, + "eval_scarebleu_sys_len": 239607, + "eval_scarebleu_totals": [ + 239607, + 222412, + 205240, + 188177 + ], + "eval_steps_per_second": 0.583, + "eval_ter_num_edits": 169367, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.56000164858565, + "step": 69000 + }, + { + "epoch": 27.22, + "learning_rate": 4.353809711804185e-05, + "loss": 2.5159, + "step": 69500 + }, + { + "epoch": 27.22, + "eval_bleu_bleu": 0.06299317710678633, + "eval_bleu_brevity_penalty": 0.9135091826383038, + "eval_bleu_length_ratio": 0.9170426265008667, + "eval_bleu_precisions": [ + 0.3422649557003734, + 0.10776039778061465, + 0.04039312572964461, + 0.015177257445051986 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 218512, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.425888321512648, + "eval_chrf_word_order": 2, + "eval_loss": 2.507833480834961, + "eval_meteor": 0.23978841132680107, + "eval_runtime": 911.2561, + "eval_samples_per_second": 18.873, + "eval_scarebleu_bp": 0.9525901486005092, + "eval_scarebleu_counts": [ + 87969, + 26929, + 9738, + 3587 + ], + "eval_scarebleu_precisions": [ + 36.795566244902226, + 12.13674058049396, + 4.756950041766197, + 1.9115374367172928 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.604283949743582, + "eval_scarebleu_sys_len": 239075, + "eval_scarebleu_totals": [ + 239075, + 221880, + 204711, + 187650 + ], + "eval_steps_per_second": 0.59, + "eval_ter_num_edits": 169366, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.55954370812707, + "step": 69500 + }, + { + "epoch": 27.42, + "learning_rate": 4.348874851954205e-05, + "loss": 2.5123, + "step": 70000 + }, + { + "epoch": 27.42, + "eval_bleu_bleu": 0.06316923048459688, + "eval_bleu_brevity_penalty": 0.91673204270931, + "eval_bleu_length_ratio": 0.9200139332463205, + "eval_bleu_precisions": [ + 0.3439877748380622, + 0.10816978096770202, + 0.04039054470709147, + 0.015001131936087314 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219220, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.54672997544509, + "eval_chrf_word_order": 2, + "eval_loss": 2.5011634826660156, + "eval_meteor": 0.24141487327191014, + "eval_runtime": 903.833, + "eval_samples_per_second": 19.028, + "eval_scarebleu_bp": 0.9543643023757927, + "eval_scarebleu_counts": [ + 88539, + 27176, + 9787, + 3579 + ], + "eval_scarebleu_precisions": [ + 36.96826722338204, + 12.22464631924608, + 4.771004460477247, + 1.9030249536074526 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.638254282514317, + "eval_scarebleu_sys_len": 239500, + "eval_scarebleu_totals": [ + 239500, + 222305, + 205135, + 188069 + ], + "eval_steps_per_second": 0.595, + "eval_ter_num_edits": 168948, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.36812459643997, + "step": 70000 + }, + { + "epoch": 27.61, + "learning_rate": 4.343949861823924e-05, + "loss": 2.5222, + "step": 70500 + }, + { + "epoch": 27.61, + "eval_bleu_bleu": 0.06324274590063843, + "eval_bleu_brevity_penalty": 0.9199091567354672, + "eval_bleu_length_ratio": 0.9229516659042551, + "eval_bleu_precisions": [ + 0.3434521644234267, + 0.10868911086447157, + 0.04038324747267907, + 0.014818681742411209 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219920, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.69911431884916, + "eval_chrf_word_order": 2, + "eval_loss": 2.4985249042510986, + "eval_meteor": 0.24159429543557853, + "eval_runtime": 911.335, + "eval_samples_per_second": 18.871, + "eval_scarebleu_bp": 0.9530997422122419, + "eval_scarebleu_counts": [ + 88393, + 27218, + 9780, + 3540 + ], + "eval_scarebleu_precisions": [ + 36.95405878836273, + 12.260249907658489, + 4.774691207342674, + 1.8852651087489083 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.616547397863784, + "eval_scarebleu_sys_len": 239197, + "eval_scarebleu_totals": [ + 239197, + 222002, + 204830, + 187772 + ], + "eval_steps_per_second": 0.59, + "eval_ter_num_edits": 168949, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.36858253689856, + "step": 70500 + }, + { + "epoch": 27.81, + "learning_rate": 4.339015001973944e-05, + "loss": 2.514, + "step": 71000 + }, + { + "epoch": 27.81, + "eval_bleu_bleu": 0.06339116085605866, + "eval_bleu_brevity_penalty": 0.9200043270593877, + "eval_bleu_length_ratio": 0.9230397978839932, + "eval_bleu_precisions": [ + 0.34373309205650604, + 0.10876663411362, + 0.04046037211257133, + 0.014900760460784663 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219941, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.617437388381994, + "eval_chrf_word_order": 2, + "eval_loss": 2.4930663108825684, + "eval_meteor": 0.24153406439036662, + "eval_runtime": 904.0788, + "eval_samples_per_second": 19.023, + "eval_scarebleu_bp": 0.9584854165955322, + "eval_scarebleu_counts": [ + 88790, + 27300, + 9823, + 3576 + ], + "eval_scarebleu_precisions": [ + 36.920454072934426, + 12.225979085962516, + 4.765554881746513, + 1.8914830369516233 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.655122794885874, + "eval_scarebleu_sys_len": 240490, + "eval_scarebleu_totals": [ + 240490, + 223295, + 206125, + 189058 + ], + "eval_steps_per_second": 0.595, + "eval_ter_num_edits": 169005, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.39422720257913, + "step": 71000 + }, + { + "epoch": 28.01, + "learning_rate": 4.334080142123964e-05, + "loss": 2.5124, + "step": 71500 + }, + { + "epoch": 28.01, + "eval_bleu_bleu": 0.06435639551810675, + "eval_bleu_brevity_penalty": 0.9250725354788072, + "eval_bleu_length_ratio": 0.9277443668976284, + "eval_bleu_precisions": [ + 0.3418000379983896, + 0.1089582914351023, + 0.04086463789539081, + 0.015391595905788348 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221062, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.851272502025868, + "eval_chrf_word_order": 2, + "eval_loss": 2.4903171062469482, + "eval_meteor": 0.24246089610495208, + "eval_runtime": 908.2214, + "eval_samples_per_second": 18.936, + "eval_scarebleu_bp": 0.9663286411202541, + "eval_scarebleu_counts": [ + 88975, + 27636, + 9977, + 3671 + ], + "eval_scarebleu_precisions": [ + 36.70812962848361, + 12.272303388249922, + 4.796173444861071, + 1.9224424602655077 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.757718102907601, + "eval_scarebleu_sys_len": 242385, + "eval_scarebleu_totals": [ + 242385, + 225190, + 208020, + 190955 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 169002, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.39285338120338, + "step": 71500 + }, + { + "epoch": 28.2, + "learning_rate": 4.329145282273984e-05, + "loss": 2.4774, + "step": 72000 + }, + { + "epoch": 28.2, + "eval_bleu_bleu": 0.0650282778454471, + "eval_bleu_brevity_penalty": 0.9223582704824913, + "eval_bleu_length_ratio": 0.9252221135727445, + "eval_bleu_precisions": [ + 0.3442876517842158, + 0.1101217124359214, + 0.04151890300255765, + 0.015695319199266686 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 220461, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.882686536743805, + "eval_chrf_word_order": 2, + "eval_loss": 2.4854624271392822, + "eval_meteor": 0.24350141649839685, + "eval_runtime": 933.4291, + "eval_samples_per_second": 18.425, + "eval_scarebleu_bp": 0.9591706910767873, + "eval_scarebleu_counts": [ + 89076, + 27717, + 10065, + 3734 + ], + "eval_scarebleu_precisions": [ + 37.01398267229021, + 12.40356215877562, + 4.879148366830517, + 1.9733539089213141 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.820980663362548, + "eval_scarebleu_sys_len": 240655, + "eval_scarebleu_totals": [ + 240655, + 223460, + 206286, + 189221 + ], + "eval_steps_per_second": 0.576, + "eval_ter_num_edits": 168581, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.20006044814053, + "step": 72000 + }, + { + "epoch": 28.4, + "learning_rate": 4.324220292143703e-05, + "loss": 2.486, + "step": 72500 + }, + { + "epoch": 28.4, + "eval_bleu_bleu": 0.06484761387805417, + "eval_bleu_brevity_penalty": 0.9202761963787717, + "eval_bleu_length_ratio": 0.9232916035403875, + "eval_bleu_precisions": [ + 0.3451847946145699, + 0.11064761397591787, + 0.04153492305454859, + 0.015541614288086146 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 220001, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 26.92818566909605, + "eval_chrf_word_order": 2, + "eval_loss": 2.4798872470855713, + "eval_meteor": 0.24382721256749826, + "eval_runtime": 904.5458, + "eval_samples_per_second": 19.013, + "eval_scarebleu_bp": 0.9548146681462187, + "eval_scarebleu_counts": [ + 88953, + 27681, + 10061, + 3680 + ], + "eval_scarebleu_precisions": [ + 37.124386497946645, + 12.445765310480953, + 4.901970337744343, + 1.9555952342994398 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.789358952005704, + "eval_scarebleu_sys_len": 239608, + "eval_scarebleu_totals": [ + 239608, + 222413, + 205244, + 188178 + ], + "eval_steps_per_second": 0.595, + "eval_ter_num_edits": 168398, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.1162573442201, + "step": 72500 + }, + { + "epoch": 28.59, + "learning_rate": 4.319285432293723e-05, + "loss": 2.4862, + "step": 73000 + }, + { + "epoch": 28.59, + "eval_bleu_bleu": 0.06456260628036992, + "eval_bleu_brevity_penalty": 0.9210959237098734, + "eval_bleu_length_ratio": 0.9240512172705106, + "eval_bleu_precisions": [ + 0.34373836190060947, + 0.10990851630892619, + 0.04129536355417797, + 0.015471917167193849 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 220182, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.011388195580594, + "eval_chrf_word_order": 2, + "eval_loss": 2.4762187004089355, + "eval_meteor": 0.24310844060061812, + "eval_runtime": 898.6997, + "eval_samples_per_second": 19.137, + "eval_scarebleu_bp": 0.9568097916868865, + "eval_scarebleu_counts": [ + 88829, + 27608, + 10040, + 3682 + ], + "eval_scarebleu_precisions": [ + 36.99867131498165, + 12.386267788884302, + 4.880372541585246, + 1.9516383797479089 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.777147587663673, + "eval_scarebleu_sys_len": 240087, + "eval_scarebleu_totals": [ + 240087, + 222892, + 205722, + 188662 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 168657, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.23486392299273, + "step": 73000 + }, + { + "epoch": 28.79, + "learning_rate": 4.314350572443743e-05, + "loss": 2.4885, + "step": 73500 + }, + { + "epoch": 28.79, + "eval_bleu_bleu": 0.06536537892755359, + "eval_bleu_brevity_penalty": 0.919469452374102, + "eval_bleu_length_ratio": 0.9225445800930842, + "eval_bleu_precisions": [ + 0.34662887868876324, + 0.11142092899303156, + 0.042027000797946905, + 0.01573555249537015 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219823, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.001794458568824, + "eval_chrf_word_order": 2, + "eval_loss": 2.467904806137085, + "eval_meteor": 0.2450840065968893, + "eval_runtime": 905.7265, + "eval_samples_per_second": 18.988, + "eval_scarebleu_bp": 0.9580366294409757, + "eval_scarebleu_counts": [ + 89500, + 28006, + 10228, + 3768 + ], + "eval_scarebleu_precisions": [ + 37.23240508856736, + 12.548221894644401, + 4.964638840484038, + 1.9941466925637592 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.900764651286006, + "eval_scarebleu_sys_len": 240382, + "eval_scarebleu_totals": [ + 240382, + 223187, + 206017, + 188953 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 168207, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.02879071663102, + "step": 73500 + }, + { + "epoch": 28.99, + "learning_rate": 4.3094157125937625e-05, + "loss": 2.4921, + "step": 74000 + }, + { + "epoch": 28.99, + "eval_bleu_bleu": 0.06620184614856583, + "eval_bleu_brevity_penalty": 0.9210053764935396, + "eval_bleu_length_ratio": 0.9239672820517125, + "eval_bleu_precisions": [ + 0.34891579836665726, + 0.11227440914040214, + 0.04254162675305945, + 0.01601829308026326 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 220162, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.094356008707305, + "eval_chrf_word_order": 2, + "eval_loss": 2.4593911170959473, + "eval_meteor": 0.24705816236419825, + "eval_runtime": 900.0086, + "eval_samples_per_second": 19.109, + "eval_scarebleu_bp": 0.9550981324680194, + "eval_scarebleu_counts": [ + 89795, + 28126, + 10296, + 3804 + ], + "eval_scarebleu_precisions": [ + 37.46516130108981, + 12.641978416134412, + 5.014709033879483, + 2.020641994719984 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.949548021225385, + "eval_scarebleu_sys_len": 239676, + "eval_scarebleu_totals": [ + 239676, + 222481, + 205316, + 188257 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 167721, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.80623165376038, + "step": 74000 + }, + { + "epoch": 29.18, + "learning_rate": 4.304490722463482e-05, + "loss": 2.4586, + "step": 74500 + }, + { + "epoch": 29.18, + "eval_bleu_bleu": 0.06598183440029617, + "eval_bleu_brevity_penalty": 0.9272129443710682, + "eval_bleu_length_ratio": 0.929737828344084, + "eval_bleu_precisions": [ + 0.344028311297887, + 0.1111421049025653, + 0.042097390282340996, + 0.015931314935828122 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221537, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.278076124383688, + "eval_chrf_word_order": 2, + "eval_loss": 2.4666826725006104, + "eval_meteor": 0.2458254107161909, + "eval_runtime": 899.5756, + "eval_samples_per_second": 19.118, + "eval_scarebleu_bp": 0.967008762422872, + "eval_scarebleu_counts": [ + 89618, + 28159, + 10332, + 3864 + ], + "eval_scarebleu_precisions": [ + 36.948258091115235, + 12.495396152736793, + 4.962917419206087, + 2.021808744427468 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 7.977846736534355, + "eval_scarebleu_sys_len": 242550, + "eval_scarebleu_totals": [ + 242550, + 225355, + 208184, + 191116 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 168304, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 77.07321094111343, + "step": 74500 + }, + { + "epoch": 29.38, + "learning_rate": 4.299555862613502e-05, + "loss": 2.4622, + "step": 75000 + }, + { + "epoch": 29.38, + "eval_bleu_bleu": 0.06688924299788863, + "eval_bleu_brevity_penalty": 0.9249462315790966, + "eval_bleu_length_ratio": 0.927626857591311, + "eval_bleu_precisions": [ + 0.34723164761982317, + 0.11257904522687022, + 0.04288530350753144, + 0.01631450210709339 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221034, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.39288828947749, + "eval_chrf_word_order": 2, + "eval_loss": 2.4598822593688965, + "eval_meteor": 0.24752760923740552, + "eval_runtime": 905.8573, + "eval_samples_per_second": 18.985, + "eval_scarebleu_bp": 0.9672065319482221, + "eval_scarebleu_counts": [ + 90292, + 28469, + 10487, + 3933 + ], + "eval_scarebleu_precisions": [ + 37.218773444133916, + 12.630266677905796, + 5.0361854269015955, + 2.0573742192649322 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.080097782354539, + "eval_scarebleu_sys_len": 242598, + "eval_scarebleu_totals": [ + 242598, + 225403, + 208233, + 191166 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 167873, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.87583860346477, + "step": 75000 + }, + { + "epoch": 29.57, + "learning_rate": 4.294621002763522e-05, + "loss": 2.4555, + "step": 75500 + }, + { + "epoch": 29.57, + "eval_bleu_bleu": 0.06720895138309266, + "eval_bleu_brevity_penalty": 0.9261680535320054, + "eval_bleu_length_ratio": 0.9287641798060257, + "eval_bleu_precisions": [ + 0.3480852217527846, + 0.11288520895595512, + 0.042924079204955126, + 0.016440903367031103 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221305, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.36070988647066, + "eval_chrf_word_order": 2, + "eval_loss": 2.4501144886016846, + "eval_meteor": 0.24848768967540952, + "eval_runtime": 923.9655, + "eval_samples_per_second": 18.613, + "eval_scarebleu_bp": 0.9633556013142526, + "eval_scarebleu_counts": [ + 90244, + 28543, + 10481, + 3937 + ], + "eval_scarebleu_precisions": [ + 37.34260236277492, + 12.715730387134139, + 5.0559087707788635, + 2.0695020474245553 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.087967025527, + "eval_scarebleu_sys_len": 241665, + "eval_scarebleu_totals": [ + 241665, + 224470, + 207302, + 190239 + ], + "eval_steps_per_second": 0.582, + "eval_ter_num_edits": 167555, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.73021353763583, + "step": 75500 + }, + { + "epoch": 29.77, + "learning_rate": 4.289686142913542e-05, + "loss": 2.4559, + "step": 76000 + }, + { + "epoch": 29.77, + "eval_bleu_bleu": 0.06779550545474074, + "eval_bleu_brevity_penalty": 0.9298476941818343, + "eval_bleu_length_ratio": 0.9321971302548693, + "eval_bleu_precisions": [ + 0.34813594269841486, + 0.11352767801374142, + 0.04321684578269622, + 0.016544462143928036 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222123, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.471293823021636, + "eval_chrf_word_order": 2, + "eval_loss": 2.4473018646240234, + "eval_meteor": 0.2494442970509638, + "eval_runtime": 899.0605, + "eval_samples_per_second": 19.129, + "eval_scarebleu_bp": 0.9660234717580519, + "eval_scarebleu_counts": [ + 90540, + 28724, + 10561, + 3973 + ], + "eval_scarebleu_precisions": [ + 37.36520422102174, + 12.759643916913946, + 5.07862466939168, + 2.081412405699916 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.139359326889949, + "eval_scarebleu_sys_len": 242311, + "eval_scarebleu_totals": [ + 242311, + 225116, + 207950, + 190880 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 167512, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.71052209791684, + "step": 76000 + }, + { + "epoch": 29.96, + "learning_rate": 4.284761152783261e-05, + "loss": 2.4625, + "step": 76500 + }, + { + "epoch": 29.96, + "eval_bleu_bleu": 0.06813441764997567, + "eval_bleu_brevity_penalty": 0.928751414050255, + "eval_bleu_length_ratio": 0.931173120585532, + "eval_bleu_precisions": [ + 0.34965454143925295, + 0.11408805768892537, + 0.04360948764984429, + 0.01664975691003032 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221879, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.498826146986126, + "eval_chrf_word_order": 2, + "eval_loss": 2.4393856525421143, + "eval_meteor": 0.2504070921672424, + "eval_runtime": 894.9924, + "eval_samples_per_second": 19.216, + "eval_scarebleu_bp": 0.9643062494976016, + "eval_scarebleu_counts": [ + 90764, + 28796, + 10665, + 4014 + ], + "eval_scarebleu_precisions": [ + 37.52206535893673, + 12.81530930129061, + 5.139016045872886, + 2.107484879032258 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.191813354857814, + "eval_scarebleu_sys_len": 241895, + "eval_scarebleu_totals": [ + 241895, + 224700, + 207530, + 190464 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 167281, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.60473785198448, + "step": 76500 + }, + { + "epoch": 30.16, + "learning_rate": 4.279826292933281e-05, + "loss": 2.4251, + "step": 77000 + }, + { + "epoch": 30.16, + "eval_bleu_bleu": 0.06779490763415988, + "eval_bleu_brevity_penalty": 0.9281129008160122, + "eval_bleu_length_ratio": 0.9305771805320654, + "eval_bleu_precisions": [ + 0.34690196043060023, + 0.11361969668821073, + 0.04317802195456462, + 0.016728689996830352 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221737, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.603745898120497, + "eval_chrf_word_order": 2, + "eval_loss": 2.4478092193603516, + "eval_meteor": 0.24876313223406832, + "eval_runtime": 884.6044, + "eval_samples_per_second": 19.441, + "eval_scarebleu_bp": 0.9682071599052247, + "eval_scarebleu_counts": [ + 90409, + 28773, + 10577, + 3996 + ], + "eval_scarebleu_precisions": [ + 37.2297099748395, + 12.751389344371272, + 5.073461341059206, + 2.0877415714487233 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.153148516355506, + "eval_scarebleu_sys_len": 242841, + "eval_scarebleu_totals": [ + 242841, + 225646, + 208477, + 191403 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 167835, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.85843686603869, + "step": 77000 + }, + { + "epoch": 30.36, + "learning_rate": 4.274891433083301e-05, + "loss": 2.426, + "step": 77500 + }, + { + "epoch": 30.36, + "eval_bleu_bleu": 0.06886453149564756, + "eval_bleu_brevity_penalty": 0.9253656840941981, + "eval_bleu_length_ratio": 0.9280171563587223, + "eval_bleu_precisions": [ + 0.35176165732814174, + 0.11559735598140557, + 0.044229451321368914, + 0.017053788650836194 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221127, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.6604395840679, + "eval_chrf_word_order": 2, + "eval_loss": 2.4327285289764404, + "eval_meteor": 0.25215675567240114, + "eval_runtime": 911.8491, + "eval_samples_per_second": 18.861, + "eval_scarebleu_bp": 0.9612693939564749, + "eval_scarebleu_counts": [ + 90994, + 29106, + 10766, + 4089 + ], + "eval_scarebleu_precisions": [ + 37.73163985884948, + 12.995722565032192, + 5.206096829725913, + 2.155190588632147 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.27887115648222, + "eval_scarebleu_sys_len": 241161, + "eval_scarebleu_totals": [ + 241161, + 223966, + 206796, + 189728 + ], + "eval_steps_per_second": 0.59, + "eval_ter_num_edits": 166962, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.45865484569696, + "step": 77500 + }, + { + "epoch": 30.55, + "learning_rate": 4.2699565732333205e-05, + "loss": 2.4316, + "step": 78000 + }, + { + "epoch": 30.55, + "eval_bleu_bleu": 0.06877581577294974, + "eval_bleu_brevity_penalty": 0.9192155214962567, + "eval_bleu_length_ratio": 0.9223095614804494, + "eval_bleu_precisions": [ + 0.35191816787779784, + 0.11610192919060877, + 0.04475784704994067, + 0.017136546089352302 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 219767, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.60406398760502, + "eval_chrf_word_order": 2, + "eval_loss": 2.427431583404541, + "eval_meteor": 0.2511984519035508, + "eval_runtime": 895.7037, + "eval_samples_per_second": 19.201, + "eval_scarebleu_bp": 0.9654004821173208, + "eval_scarebleu_counts": [ + 91145, + 29182, + 10837, + 4078 + ], + "eval_scarebleu_precisions": [ + 37.63833828873472, + 12.971795612650856, + 5.2152612683715605, + 2.138100980443559 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.292609534482864, + "eval_scarebleu_sys_len": 242160, + "eval_scarebleu_totals": [ + 242160, + 224965, + 207794, + 190730 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 166945, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.45086985790107, + "step": 78000 + }, + { + "epoch": 30.75, + "learning_rate": 4.26503158310304e-05, + "loss": 2.439, + "step": 78500 + }, + { + "epoch": 30.75, + "eval_bleu_bleu": 0.06896402962453387, + "eval_bleu_brevity_penalty": 0.9261410170737261, + "eval_bleu_length_ratio": 0.9287389992403863, + "eval_bleu_precisions": [ + 0.35145662655502286, + 0.11536765570493474, + 0.044508988986418904, + 0.01703642676396163 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221299, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.795770403839676, + "eval_chrf_word_order": 2, + "eval_loss": 2.423835515975952, + "eval_meteor": 0.25227257394204383, + "eval_runtime": 886.5255, + "eval_samples_per_second": 19.399, + "eval_scarebleu_bp": 0.9584189417870176, + "eval_scarebleu_counts": [ + 90807, + 29027, + 10790, + 4074 + ], + "eval_scarebleu_precisions": [ + 37.76167070036678, + 13.000326945212045, + 5.235094052176276, + 2.1550652497050935 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.26804792399512, + "eval_scarebleu_sys_len": 240474, + "eval_scarebleu_totals": [ + 240474, + 223279, + 206109, + 189043 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 166894, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.42751489451342, + "step": 78500 + }, + { + "epoch": 30.94, + "learning_rate": 4.26009672325306e-05, + "loss": 2.4299, + "step": 79000 + }, + { + "epoch": 30.94, + "eval_bleu_bleu": 0.06965336116182497, + "eval_bleu_brevity_penalty": 0.9286974698226388, + "eval_bleu_length_ratio": 0.9311227594542532, + "eval_bleu_precisions": [ + 0.3518819833503856, + 0.11634224515322077, + 0.04487011982785744, + 0.017225806451612903 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221867, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 27.893918748872775, + "eval_chrf_word_order": 2, + "eval_loss": 2.418041706085205, + "eval_meteor": 0.25311324234101396, + "eval_runtime": 894.1472, + "eval_samples_per_second": 19.234, + "eval_scarebleu_bp": 0.962201254043897, + "eval_scarebleu_counts": [ + 91137, + 29261, + 10883, + 4092 + ], + "eval_scarebleu_precisions": [ + 37.75571077030151, + 13.051817423536182, + 5.257005395640014, + 2.1542170958079105 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.316417841078453, + "eval_scarebleu_sys_len": 241386, + "eval_scarebleu_totals": [ + 241386, + 224191, + 207019, + 189953 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 166756, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.36431911122916, + "step": 79000 + }, + { + "epoch": 31.14, + "learning_rate": 4.2551618634030795e-05, + "loss": 2.4129, + "step": 79500 + }, + { + "epoch": 31.14, + "eval_bleu_bleu": 0.07007993110442366, + "eval_bleu_brevity_penalty": 0.9318441843146127, + "eval_bleu_length_ratio": 0.9340646888731278, + "eval_bleu_precisions": [ + 0.3512858991409367, + 0.11655378262965434, + 0.04489934704416616, + 0.017401005858747525 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222568, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.0220489845432, + "eval_chrf_word_order": 2, + "eval_loss": 2.4172847270965576, + "eval_meteor": 0.25404311437875043, + "eval_runtime": 890.9005, + "eval_samples_per_second": 19.304, + "eval_scarebleu_bp": 0.9679931152351775, + "eval_scarebleu_counts": [ + 91498, + 29482, + 10995, + 4185 + ], + "eval_scarebleu_precisions": [ + 37.68622136917241, + 13.0686099807619, + 5.275228257375484, + 2.187023140115805 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.404249268184694, + "eval_scarebleu_sys_len": 242789, + "eval_scarebleu_totals": [ + 242789, + 225594, + 208427, + 191356 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 166752, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.36248734939484, + "step": 79500 + }, + { + "epoch": 31.34, + "learning_rate": 4.250227003553099e-05, + "loss": 2.3965, + "step": 80000 + }, + { + "epoch": 31.34, + "eval_bleu_bleu": 0.07004388071448517, + "eval_bleu_brevity_penalty": 0.9315886612170275, + "eval_bleu_length_ratio": 0.933825473499553, + "eval_bleu_precisions": [ + 0.3516500307849949, + 0.11641567145278497, + 0.04480181970854902, + 0.017424738219895288 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222511, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.08122807175664, + "eval_chrf_word_order": 2, + "eval_loss": 2.4134795665740967, + "eval_meteor": 0.2540396489359582, + "eval_runtime": 908.9921, + "eval_samples_per_second": 18.92, + "eval_scarebleu_bp": 0.9700945932910068, + "eval_scarebleu_counts": [ + 91687, + 29590, + 10973, + 4172 + ], + "eval_scarebleu_precisions": [ + 37.684751335799426, + 13.086840184869862, + 5.251897728469277, + 2.174513575073361 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.403956450234203, + "eval_scarebleu_sys_len": 243300, + "eval_scarebleu_totals": [ + 243300, + 226105, + 208934, + 191859 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 166550, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.26998337676135, + "step": 80000 + }, + { + "epoch": 31.53, + "learning_rate": 4.245302013422819e-05, + "loss": 2.4055, + "step": 80500 + }, + { + "epoch": 31.53, + "eval_bleu_bleu": 0.07044269819277872, + "eval_bleu_brevity_penalty": 0.9313196238235444, + "eval_bleu_length_ratio": 0.9335736678431586, + "eval_bleu_precisions": [ + 0.3526844113984653, + 0.11694664224188331, + 0.0451500749577366, + 0.017575853220875928 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222451, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.112452029890566, + "eval_chrf_word_order": 2, + "eval_loss": 2.4083094596862793, + "eval_meteor": 0.25471256124839076, + "eval_runtime": 928.8116, + "eval_samples_per_second": 18.516, + "eval_scarebleu_bp": 0.9622840456433412, + "eval_scarebleu_counts": [ + 91493, + 29517, + 11017, + 4209 + ], + "eval_scarebleu_precisions": [ + 37.90005219422881, + 13.164831341905616, + 5.321116869442579, + 2.2155313537954595 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.42727637217431, + "eval_scarebleu_sys_len": 241406, + "eval_scarebleu_totals": [ + 241406, + 224211, + 207043, + 189977 + ], + "eval_steps_per_second": 0.579, + "eval_ter_num_edits": 166408, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.20495583164278, + "step": 80500 + }, + { + "epoch": 31.73, + "learning_rate": 4.240367153572839e-05, + "loss": 2.4095, + "step": 81000 + }, + { + "epoch": 31.73, + "eval_bleu_bleu": 0.07042339450095542, + "eval_bleu_brevity_penalty": 0.9336266690319568, + "eval_bleu_length_ratio": 0.9357349997272105, + "eval_bleu_precisions": [ + 0.35138541302261334, + 0.11690179860135783, + 0.0451224684550949, + 0.017465340303152152 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222966, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.241957566911523, + "eval_chrf_word_order": 2, + "eval_loss": 2.4066855907440186, + "eval_meteor": 0.2547593694341076, + "eval_runtime": 890.4984, + "eval_samples_per_second": 19.313, + "eval_scarebleu_bp": 0.9628923615500885, + "eval_scarebleu_counts": [ + 91223, + 29496, + 10993, + 4164 + ], + "eval_scarebleu_precisions": [ + 37.76521094749393, + 13.146845666301179, + 5.305732391850998, + 2.190172625998043 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.39193349462186, + "eval_scarebleu_sys_len": 241553, + "eval_scarebleu_totals": [ + 241553, + 224358, + 207191, + 190122 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 166603, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.29425422106618, + "step": 81000 + }, + { + "epoch": 31.92, + "learning_rate": 4.235432293722859e-05, + "loss": 2.4086, + "step": 81500 + }, + { + "epoch": 31.92, + "eval_bleu_bleu": 0.07090889755906221, + "eval_bleu_brevity_penalty": 0.9280184406794167, + "eval_bleu_length_ratio": 0.9304890485523273, + "eval_bleu_precisions": [ + 0.3533168557975067, + 0.1180563365131209, + 0.04579272653523051, + 0.017845402460787075 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221716, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.263858007899906, + "eval_chrf_word_order": 2, + "eval_loss": 2.402545690536499, + "eval_meteor": 0.25541104351031135, + "eval_runtime": 919.2275, + "eval_samples_per_second": 18.709, + "eval_scarebleu_bp": 0.9628178930240309, + "eval_scarebleu_counts": [ + 91551, + 29739, + 11147, + 4255 + ], + "eval_scarebleu_precisions": [ + 37.903823462438154, + 13.256218240171169, + 5.380579328187825, + 2.238224990268587 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.491863681953527, + "eval_scarebleu_sys_len": 241535, + "eval_scarebleu_totals": [ + 241535, + 224340, + 207171, + 190106 + ], + "eval_steps_per_second": 0.585, + "eval_ter_num_edits": 166163, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.09276041929029, + "step": 81500 + }, + { + "epoch": 32.12, + "learning_rate": 4.230497433872878e-05, + "loss": 2.3852, + "step": 82000 + }, + { + "epoch": 32.12, + "eval_bleu_bleu": 0.0708220989649878, + "eval_bleu_brevity_penalty": 0.9218788421413443, + "eval_bleu_length_ratio": 0.9247772569131144, + "eval_bleu_precisions": [ + 0.3546912935944272, + 0.11865524709588501, + 0.04607204872777709, + 0.017964071856287425 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 220355, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.258856123531846, + "eval_chrf_word_order": 2, + "eval_loss": 2.403284788131714, + "eval_meteor": 0.25583854833636993, + "eval_runtime": 908.3112, + "eval_samples_per_second": 18.934, + "eval_scarebleu_bp": 0.9582485807581953, + "eval_scarebleu_counts": [ + 91513, + 29740, + 11126, + 4260 + ], + "eval_scarebleu_precisions": [ + 38.06174693157761, + 13.322104659600964, + 5.399110015480102, + 2.253765534317019 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.49280792055298, + "eval_scarebleu_sys_len": 240433, + "eval_scarebleu_totals": [ + 240433, + 223238, + 206071, + 189017 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 166160, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.09138659791454, + "step": 82000 + }, + { + "epoch": 32.31, + "learning_rate": 4.225572443742598e-05, + "loss": 2.3766, + "step": 82500 + }, + { + "epoch": 32.31, + "eval_bleu_bleu": 0.07125108551342756, + "eval_bleu_brevity_penalty": 0.9277080133660088, + "eval_bleu_length_ratio": 0.9301994720474738, + "eval_bleu_precisions": [ + 0.35459085843706434, + 0.11878582748028878, + 0.04611951136169486, + 0.017911990462599177 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221647, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.2453412650509, + "eval_chrf_word_order": 2, + "eval_loss": 2.3963427543640137, + "eval_meteor": 0.25600550593797305, + "eval_runtime": 889.1897, + "eval_samples_per_second": 19.341, + "eval_scarebleu_bp": 0.9629337306463684, + "eval_scarebleu_counts": [ + 91881, + 29903, + 11224, + 4262 + ], + "eval_scarebleu_precisions": [ + 38.03604028762683, + 13.327658133067104, + 5.4171191389753615, + 2.241624151896071 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.52936071808373, + "eval_scarebleu_sys_len": 241563, + "eval_scarebleu_totals": [ + 241563, + 224368, + 207195, + 190130 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 166107, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 76.06711575360971, + "step": 82500 + }, + { + "epoch": 32.51, + "learning_rate": 4.220637583892618e-05, + "loss": 2.3865, + "step": 83000 + }, + { + "epoch": 32.51, + "eval_bleu_bleu": 0.07125763872625927, + "eval_bleu_brevity_penalty": 0.9271904358350417, + "eval_bleu_length_ratio": 0.9297168445393845, + "eval_bleu_precisions": [ + 0.35547009009985014, + 0.11922950811649383, + 0.04619543441445003, + 0.017818209599031517 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221532, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.324793957469247, + "eval_chrf_word_order": 2, + "eval_loss": 2.3915367126464844, + "eval_meteor": 0.25716167480951796, + "eval_runtime": 910.7642, + "eval_samples_per_second": 18.883, + "eval_scarebleu_bp": 0.9589215524493104, + "eval_scarebleu_counts": [ + 91810, + 29926, + 11216, + 4240 + ], + "eval_scarebleu_precisions": [ + 38.15956275068061, + 13.395702775290959, + 5.438587984289386, + 2.2414768371915987 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.519819746270617, + "eval_scarebleu_sys_len": 240595, + "eval_scarebleu_totals": [ + 240595, + 223400, + 206230, + 189161 + ], + "eval_steps_per_second": 0.591, + "eval_ter_num_edits": 165877, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.96178944813595, + "step": 83000 + }, + { + "epoch": 32.71, + "learning_rate": 4.2157027240426375e-05, + "loss": 2.3791, + "step": 83500 + }, + { + "epoch": 32.71, + "eval_bleu_bleu": 0.07206842318270457, + "eval_bleu_brevity_penalty": 0.9277395100663456, + "eval_bleu_length_ratio": 0.9302288493740531, + "eval_bleu_precisions": [ + 0.356285020798181, + 0.12012188262683472, + 0.046827617135779265, + 0.018169966114833715 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221654, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.4257865861632, + "eval_chrf_word_order": 2, + "eval_loss": 2.3862781524658203, + "eval_meteor": 0.2582128417119766, + "eval_runtime": 884.4439, + "eval_samples_per_second": 19.445, + "eval_scarebleu_bp": 0.9634713789663382, + "eval_scarebleu_counts": [ + 92321, + 30230, + 11402, + 4353 + ], + "eval_scarebleu_precisions": [ + 38.19763087884217, + 13.465598802661939, + 5.499524905101603, + 2.2879939449367686 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.64170334338229, + "eval_scarebleu_sys_len": 241693, + "eval_scarebleu_totals": [ + 241693, + 224498, + 207327, + 190254 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 165637, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.85188373807638, + "step": 83500 + }, + { + "epoch": 32.9, + "learning_rate": 4.210767864192657e-05, + "loss": 2.3822, + "step": 84000 + }, + { + "epoch": 32.9, + "eval_bleu_bleu": 0.07261425133909395, + "eval_bleu_brevity_penalty": 0.9346732801747116, + "eval_bleu_length_ratio": 0.9367170417871487, + "eval_bleu_precisions": [ + 0.3554480286738351, + 0.11981262590713818, + 0.04679375165475245, + 0.018280226975120033 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223200, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.491706937158582, + "eval_chrf_word_order": 2, + "eval_loss": 2.384209156036377, + "eval_meteor": 0.25869125905610824, + "eval_runtime": 870.2737, + "eval_samples_per_second": 19.762, + "eval_scarebleu_bp": 0.9684088152598506, + "eval_scarebleu_counts": [ + 92574, + 30334, + 11440, + 4408 + ], + "eval_scarebleu_precisions": [ + 38.11354934332414, + 13.440262300892797, + 5.4862053586414925, + 2.3024288325933666 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.685505260333144, + "eval_scarebleu_sys_len": 242890, + "eval_scarebleu_totals": [ + 242890, + 225695, + 208523, + 191450 + ], + "eval_steps_per_second": 0.618, + "eval_ter_num_edits": 165659, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.86195842816517, + "step": 84000 + }, + { + "epoch": 33.1, + "learning_rate": 4.205842874062377e-05, + "loss": 2.3584, + "step": 84500 + }, + { + "epoch": 33.1, + "eval_bleu_bleu": 0.07239294592423079, + "eval_bleu_brevity_penalty": 0.9304133690116866, + "eval_bleu_length_ratio": 0.9327259221332975, + "eval_bleu_precisions": [ + 0.3557631305427696, + 0.12011957825743463, + 0.046897285790314, + 0.018287687265917604 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222249, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.512388227310947, + "eval_chrf_word_order": 2, + "eval_loss": 2.385260820388794, + "eval_meteor": 0.25862990349631804, + "eval_runtime": 874.1169, + "eval_samples_per_second": 19.675, + "eval_scarebleu_bp": 0.9618451750030134, + "eval_scarebleu_counts": [ + 92076, + 30187, + 11387, + 4374 + ], + "eval_scarebleu_precisions": [ + 38.15830915872358, + 13.470025211396443, + 5.502640900370644, + 2.3037421325678773 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.641632886947857, + "eval_scarebleu_sys_len": 241300, + "eval_scarebleu_totals": [ + 241300, + 224105, + 206937, + 189865 + ], + "eval_steps_per_second": 0.615, + "eval_ter_num_edits": 165599, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.83448200065027, + "step": 84500 + }, + { + "epoch": 33.29, + "learning_rate": 4.2009080142123966e-05, + "loss": 2.3525, + "step": 85000 + }, + { + "epoch": 33.29, + "eval_bleu_bleu": 0.07311997389466271, + "eval_bleu_brevity_penalty": 0.9333089051885471, + "eval_bleu_length_ratio": 0.9354370297004772, + "eval_bleu_precisions": [ + 0.35712330918145313, + 0.12086047642197374, + 0.0472457649592142, + 0.01847468693888021 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222895, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.591652274837674, + "eval_chrf_word_order": 2, + "eval_loss": 2.378042697906494, + "eval_meteor": 0.26000738377369653, + "eval_runtime": 886.6908, + "eval_samples_per_second": 19.396, + "eval_scarebleu_bp": 0.9674001446268398, + "eval_scarebleu_counts": [ + 92952, + 30499, + 11517, + 4396 + ], + "eval_scarebleu_precisions": [ + 38.30781594510499, + 13.528055001108893, + 5.529602120232957, + 2.298994843473804 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.715550148578826, + "eval_scarebleu_sys_len": 242645, + "eval_scarebleu_totals": [ + 242645, + 225450, + 208279, + 191214 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 165353, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.7218286478392, + "step": 85000 + }, + { + "epoch": 33.49, + "learning_rate": 4.195973154362416e-05, + "loss": 2.3568, + "step": 85500 + }, + { + "epoch": 33.49, + "eval_bleu_bleu": 0.07357787015010725, + "eval_bleu_brevity_penalty": 0.9336803662880618, + "eval_bleu_length_ratio": 0.9357853608584894, + "eval_bleu_precisions": [ + 0.3571114639112379, + 0.12119076891677155, + 0.04769705452000764, + 0.01868233045464611 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222978, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.740005317738653, + "eval_chrf_word_order": 2, + "eval_loss": 2.3725104331970215, + "eval_meteor": 0.2607324731548161, + "eval_runtime": 897.268, + "eval_samples_per_second": 19.167, + "eval_scarebleu_bp": 0.969050557892539, + "eval_scarebleu_counts": [ + 93026, + 30660, + 11622, + 4471 + ], + "eval_scarebleu_precisions": [ + 38.2750590423212, + 13.575321782945393, + 5.56931938527595, + 2.3334220566054475 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.784393706886583, + "eval_scarebleu_sys_len": 243046, + "eval_scarebleu_totals": [ + 243046, + 225851, + 208679, + 191607 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 165140, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.62428733016134, + "step": 85500 + }, + { + "epoch": 33.69, + "learning_rate": 4.191038294512436e-05, + "loss": 2.362, + "step": 86000 + }, + { + "epoch": 33.69, + "eval_bleu_bleu": 0.0731271627716459, + "eval_bleu_brevity_penalty": 0.9343558267817608, + "eval_bleu_length_ratio": 0.9364190717604153, + "eval_bleu_precisions": [ + 0.35704906130534353, + 0.12111647421018384, + 0.047336275075883186, + 0.01832907324060111 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223129, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.664035555084862, + "eval_chrf_word_order": 2, + "eval_loss": 2.3666491508483887, + "eval_meteor": 0.26003482851751913, + "eval_runtime": 901.4795, + "eval_samples_per_second": 19.078, + "eval_scarebleu_bp": 0.9704765939803451, + "eval_scarebleu_counts": [ + 93107, + 30690, + 11611, + 4429 + ], + "eval_scarebleu_precisions": [ + 38.25377065075824, + 13.567759219798583, + 5.554837938045688, + 2.307347670250896 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.764492380722318, + "eval_scarebleu_sys_len": 243393, + "eval_scarebleu_totals": [ + 243393, + 226198, + 209025, + 191952 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 165229, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.6650440309751, + "step": 86000 + }, + { + "epoch": 33.88, + "learning_rate": 4.186113304382156e-05, + "loss": 2.3559, + "step": 86500 + }, + { + "epoch": 33.88, + "eval_bleu_bleu": 0.07316102978996578, + "eval_bleu_brevity_penalty": 0.9357367331156943, + "eval_bleu_length_ratio": 0.9377158708908464, + "eval_bleu_precisions": [ + 0.35635388787941175, + 0.12090107300611415, + 0.04707860890167541, + 0.018423377347963548 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223438, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.713675544917294, + "eval_chrf_word_order": 2, + "eval_loss": 2.3652091026306152, + "eval_meteor": 0.26063586424126967, + "eval_runtime": 883.8207, + "eval_samples_per_second": 19.459, + "eval_scarebleu_bp": 0.9682565485307812, + "eval_scarebleu_counts": [ + 92858, + 30595, + 11556, + 4438 + ], + "eval_scarebleu_precisions": [ + 38.23629932510613, + 13.558127786296076, + 5.54273846581834, + 2.3185104693442553 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.747676196491083, + "eval_scarebleu_sys_len": 242853, + "eval_scarebleu_totals": [ + 242853, + 225658, + 208489, + 191416 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 165353, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.7218286478392, + "step": 86500 + }, + { + "epoch": 34.08, + "learning_rate": 4.181178444532175e-05, + "loss": 2.3499, + "step": 87000 + }, + { + "epoch": 34.08, + "eval_bleu_bleu": 0.0728810654415116, + "eval_bleu_brevity_penalty": 0.9265419884419029, + "eval_bleu_length_ratio": 0.9291125109640379, + "eval_bleu_precisions": [ + 0.35762552622545035, + 0.1211941643445172, + 0.04741766467065868, + 0.01862722032702035 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221388, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.647710226627126, + "eval_chrf_word_order": 2, + "eval_loss": 2.365004539489746, + "eval_meteor": 0.25925639162041686, + "eval_runtime": 887.9707, + "eval_samples_per_second": 19.368, + "eval_scarebleu_bp": 0.9633886819611436, + "eval_scarebleu_counts": [ + 92683, + 30484, + 11536, + 4456 + ], + "eval_scarebleu_precisions": [ + 38.35058115718347, + 13.57994992827805, + 5.564613380927114, + 2.3422675210126 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.744539471017369, + "eval_scarebleu_sys_len": 241673, + "eval_scarebleu_totals": [ + 241673, + 224478, + 207310, + 190243 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 165222, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.66183844776502, + "step": 87000 + }, + { + "epoch": 34.27, + "learning_rate": 4.176243584682195e-05, + "loss": 2.3247, + "step": 87500 + }, + { + "epoch": 34.27, + "eval_bleu_bleu": 0.07297957987161788, + "eval_bleu_brevity_penalty": 0.9297623681889167, + "eval_bleu_length_ratio": 0.932117391797011, + "eval_bleu_precisions": [ + 0.3582105680221878, + 0.12184921111322587, + 0.04747118600737127, + 0.018320038420540932 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222104, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.826964117547615, + "eval_chrf_word_order": 2, + "eval_loss": 2.364288330078125, + "eval_meteor": 0.26073469034350377, + "eval_runtime": 865.4229, + "eval_samples_per_second": 19.872, + "eval_scarebleu_bp": 0.9617871971025508, + "eval_scarebleu_counts": [ + 92724, + 30632, + 11529, + 4372 + ], + "eval_scarebleu_precisions": [ + 38.42908415738999, + 13.669446787242682, + 5.571610832962827, + 2.3027736518872 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.714445162831863, + "eval_scarebleu_sys_len": 241286, + "eval_scarebleu_totals": [ + 241286, + 224091, + 206924, + 189858 + ], + "eval_steps_per_second": 0.622, + "eval_ter_num_edits": 165028, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.57299799880019, + "step": 87500 + }, + { + "epoch": 34.47, + "learning_rate": 4.171308724832215e-05, + "loss": 2.3295, + "step": 88000 + }, + { + "epoch": 34.47, + "eval_bleu_bleu": 0.07405504108590318, + "eval_bleu_brevity_penalty": 0.9353347113714674, + "eval_bleu_length_ratio": 0.9373381624062549, + "eval_bleu_precisions": [ + 0.3567929867292297, + 0.12201132168826066, + 0.047782310333698404, + 0.01889151190240839 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223348, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 28.933185455666727, + "eval_chrf_word_order": 2, + "eval_loss": 2.3654747009277344, + "eval_meteor": 0.2614959863908855, + "eval_runtime": 876.3421, + "eval_samples_per_second": 19.625, + "eval_scarebleu_bp": 0.966666696687835, + "eval_scarebleu_counts": [ + 92851, + 30829, + 11711, + 4513 + ], + "eval_scarebleu_precisions": [ + 38.294283345774886, + 13.6852338506339, + 5.627447682660196, + 2.362357227357908 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.831562733418528, + "eval_scarebleu_sys_len": 242467, + "eval_scarebleu_totals": [ + 242467, + 225272, + 208105, + 191038 + ], + "eval_steps_per_second": 0.614, + "eval_ter_num_edits": 165264, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.68107194702544, + "step": 88000 + }, + { + "epoch": 34.67, + "learning_rate": 4.166383734701935e-05, + "loss": 2.3364, + "step": 88500 + }, + { + "epoch": 34.67, + "eval_bleu_bleu": 0.07409147651816507, + "eval_bleu_brevity_penalty": 0.9367723589503645, + "eval_bleu_length_ratio": 0.9386895194289048, + "eval_bleu_precisions": [ + 0.35753565520633074, + 0.12211647899261412, + 0.04785523000617998, + 0.01872896111433546 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223670, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.07477239757131, + "eval_chrf_word_order": 2, + "eval_loss": 2.3539936542510986, + "eval_meteor": 0.2626406869099012, + "eval_runtime": 898.047, + "eval_samples_per_second": 19.15, + "eval_scarebleu_bp": 0.9677913787041106, + "eval_scarebleu_counts": [ + 93149, + 30894, + 11696, + 4468 + ], + "eval_scarebleu_precisions": [ + 38.37398039054132, + 13.697488306102995, + 5.613011282651783, + 2.3355130758414484 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.81750572839245, + "eval_scarebleu_sys_len": 242740, + "eval_scarebleu_totals": [ + 242740, + 225545, + 208373, + 191307 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 164968, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.5455215712853, + "step": 88500 + }, + { + "epoch": 34.86, + "learning_rate": 4.161448874851954e-05, + "loss": 2.343, + "step": 89000 + }, + { + "epoch": 34.86, + "eval_bleu_bleu": 0.07464526333906671, + "eval_bleu_brevity_penalty": 0.9406959246320116, + "eval_bleu_length_ratio": 0.9423868658169625, + "eval_bleu_precisions": [ + 0.3573664779938633, + 0.12253805050251741, + 0.04803465898336453, + 0.018848312660245305 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224551, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.06939233660405, + "eval_chrf_word_order": 2, + "eval_loss": 2.3495895862579346, + "eval_meteor": 0.2632219958151215, + "eval_runtime": 900.257, + "eval_samples_per_second": 19.103, + "eval_scarebleu_bp": 0.9733391379641829, + "eval_scarebleu_counts": [ + 93484, + 31187, + 11782, + 4528 + ], + "eval_scarebleu_precisions": [ + 38.298831173619675, + 13.74506381778436, + 5.617886450222437, + 2.3503519299046984 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.88737939345325, + "eval_scarebleu_sys_len": 244091, + "eval_scarebleu_totals": [ + 244091, + 226896, + 209723, + 192652 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 164981, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.55147479724687, + "step": 89000 + }, + { + "epoch": 35.06, + "learning_rate": 4.156514015001974e-05, + "loss": 2.3279, + "step": 89500 + }, + { + "epoch": 35.06, + "eval_bleu_bleu": 0.07515891457008701, + "eval_bleu_brevity_penalty": 0.9441354871200213, + "eval_bleu_length_ratio": 0.94563935554539, + "eval_bleu_precisions": [ + 0.3591773696777114, + 0.12302828507046043, + 0.048063882707160624, + 0.018908275604357698 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225326, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.207786227121556, + "eval_chrf_word_order": 2, + "eval_loss": 2.344093084335327, + "eval_meteor": 0.2654288531205288, + "eval_runtime": 876.2683, + "eval_samples_per_second": 19.626, + "eval_scarebleu_bp": 0.976291739456298, + "eval_scarebleu_counts": [ + 94325, + 31416, + 11886, + 4570 + ], + "eval_scarebleu_precisions": [ + 38.52940816051435, + 13.802071892381095, + 5.647977875664656, + 2.3633815490750747 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.961288874266181, + "eval_scarebleu_sys_len": 244813, + "eval_scarebleu_totals": [ + 244813, + 227618, + 210447, + 193367 + ], + "eval_steps_per_second": 0.614, + "eval_ter_num_edits": 164656, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.40264414820786, + "step": 89500 + }, + { + "epoch": 35.25, + "learning_rate": 4.151579155151994e-05, + "loss": 2.319, + "step": 90000 + }, + { + "epoch": 35.25, + "eval_bleu_bleu": 0.0747117746870393, + "eval_bleu_brevity_penalty": 0.9293311438856731, + "eval_bleu_length_ratio": 0.93171450274678, + "eval_bleu_precisions": [ + 0.3602708010522143, + 0.12390326785897379, + 0.048726679775550334, + 0.019204172526957337 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222008, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.127989451503677, + "eval_chrf_word_order": 2, + "eval_loss": 2.348289966583252, + "eval_meteor": 0.26297732782294936, + "eval_runtime": 905.9459, + "eval_samples_per_second": 18.983, + "eval_scarebleu_bp": 0.9624744412942555, + "eval_scarebleu_counts": [ + 93228, + 31079, + 11788, + 4545 + ], + "eval_scarebleu_precisions": [ + 38.611401023805975, + 13.85865324159335, + 5.692238602726364, + 2.3918409017950646 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.892056199745372, + "eval_scarebleu_sys_len": 241452, + "eval_scarebleu_totals": [ + 241452, + 224257, + 207089, + 190021 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 164658, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.40356002912502, + "step": 90000 + }, + { + "epoch": 35.45, + "learning_rate": 4.1466541650217136e-05, + "loss": 2.3108, + "step": 90500 + }, + { + "epoch": 35.45, + "eval_bleu_bleu": 0.07479715425112536, + "eval_bleu_brevity_penalty": 0.9326865312517306, + "eval_bleu_length_ratio": 0.9348536799298302, + "eval_bleu_precisions": [ + 0.36038535437878216, + 0.12411400995324989, + 0.048508235094293556, + 0.019063123621468333 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 222756, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.258269770478496, + "eval_chrf_word_order": 2, + "eval_loss": 2.3426177501678467, + "eval_meteor": 0.2644329072074268, + "eval_runtime": 890.3194, + "eval_samples_per_second": 19.317, + "eval_scarebleu_bp": 0.9686474584705574, + "eval_scarebleu_counts": [ + 93802, + 31379, + 11894, + 4595 + ], + "eval_scarebleu_precisions": [ + 38.60990829313268, + 13.89970454434714, + 5.70236839581935, + 2.399377571694133 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.966651579437588, + "eval_scarebleu_sys_len": 242948, + "eval_scarebleu_totals": [ + 242948, + 225753, + 208580, + 191508 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 164530, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.34494365042657, + "step": 90500 + }, + { + "epoch": 35.64, + "learning_rate": 4.141719305171733e-05, + "loss": 2.312, + "step": 91000 + }, + { + "epoch": 35.64, + "eval_bleu_bleu": 0.07542049656497743, + "eval_bleu_brevity_penalty": 0.9283467664794514, + "eval_bleu_length_ratio": 0.9307954121009405, + "eval_bleu_precisions": [ + 0.36173570375446934, + 0.12499389033891511, + 0.04939793103816215, + 0.01950418072465894 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 221789, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.178888898548, + "eval_chrf_word_order": 2, + "eval_loss": 2.3405649662017822, + "eval_meteor": 0.26393404146095045, + "eval_runtime": 872.3683, + "eval_samples_per_second": 19.714, + "eval_scarebleu_bp": 0.9655861804873429, + "eval_scarebleu_counts": [ + 93727, + 31428, + 12014, + 4651 + ], + "eval_scarebleu_precisions": [ + 38.69738444705931, + 13.967379227589884, + 5.7804358181092095, + 2.437988803388338 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.020658634204933, + "eval_scarebleu_sys_len": 242205, + "eval_scarebleu_totals": [ + 242205, + 225010, + 207839, + 190772 + ], + "eval_steps_per_second": 0.617, + "eval_ter_num_edits": 164357, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.26571995109195, + "step": 91000 + }, + { + "epoch": 35.84, + "learning_rate": 4.136784445321753e-05, + "loss": 2.2992, + "step": 91500 + }, + { + "epoch": 35.84, + "eval_bleu_bleu": 0.07554693855030378, + "eval_bleu_brevity_penalty": 0.9342216632453842, + "eval_bleu_length_ratio": 0.9362931689322181, + "eval_bleu_precisions": [ + 0.36040053967072916, + 0.12489315409122698, + 0.04908131476889822, + 0.019356529334692094 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223099, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.304412621151776, + "eval_chrf_word_order": 2, + "eval_loss": 2.3346972465515137, + "eval_meteor": 0.2650141260115265, + "eval_runtime": 872.3574, + "eval_samples_per_second": 19.714, + "eval_scarebleu_bp": 0.962168135557369, + "eval_scarebleu_counts": [ + 93472, + 31403, + 11955, + 4619 + ], + "eval_scarebleu_precisions": [ + 38.72432450347588, + 14.007752594978209, + 5.774999637703912, + 2.431833378084543 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 8.988981623399184, + "eval_scarebleu_sys_len": 241378, + "eval_scarebleu_totals": [ + 241378, + 224183, + 207013, + 189939 + ], + "eval_steps_per_second": 0.617, + "eval_ter_num_edits": 164300, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.23961734495282, + "step": 91500 + }, + { + "epoch": 36.04, + "learning_rate": 4.1318495854717725e-05, + "loss": 2.3079, + "step": 92000 + }, + { + "epoch": 36.04, + "eval_bleu_bleu": 0.07646677013647557, + "eval_bleu_brevity_penalty": 0.9418732874936254, + "eval_bleu_length_ratio": 0.9434990074660378, + "eval_bleu_precisions": [ + 0.36098409365881434, + 0.12474171687835045, + 0.04941668154277494, + 0.019523051730897852 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224816, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.467180089097532, + "eval_chrf_word_order": 2, + "eval_loss": 2.3307673931121826, + "eval_meteor": 0.2664864775674389, + "eval_runtime": 879.8501, + "eval_samples_per_second": 19.547, + "eval_scarebleu_bp": 0.9722327945564749, + "eval_scarebleu_counts": [ + 94387, + 31754, + 12181, + 4726 + ], + "eval_scarebleu_precisions": [ + 38.711595801838236, + 14.011631498592395, + 5.815541211519364, + 2.456532473945474 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.121806880247169, + "eval_scarebleu_sys_len": 243821, + "eval_scarebleu_totals": [ + 243821, + 226626, + 209456, + 192385 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 164086, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.14161808681635, + "step": 92000 + }, + { + "epoch": 36.23, + "learning_rate": 4.126914725621793e-05, + "loss": 2.2839, + "step": 92500 + }, + { + "epoch": 36.23, + "eval_bleu_bleu": 0.07679993724295256, + "eval_bleu_brevity_penalty": 0.9419354515204257, + "eval_bleu_length_ratio": 0.9435577621191964, + "eval_bleu_precisions": [ + 0.3612863052083797, + 0.12499819394610735, + 0.04955926900078224, + 0.019745983061693947 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224830, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.473286688686116, + "eval_chrf_word_order": 2, + "eval_loss": 2.329514741897583, + "eval_meteor": 0.26732602625784074, + "eval_runtime": 875.8247, + "eval_samples_per_second": 19.636, + "eval_scarebleu_bp": 0.9749841557357122, + "eval_scarebleu_counts": [ + 94569, + 31786, + 12195, + 4741 + ], + "eval_scarebleu_precisions": [ + 38.67963499977505, + 13.984284947513837, + 5.803577802207216, + 2.455802292634665 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.135882786818003, + "eval_scarebleu_sys_len": 244493, + "eval_scarebleu_totals": [ + 244493, + 227298, + 210129, + 193053 + ], + "eval_steps_per_second": 0.614, + "eval_ter_num_edits": 164119, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.15673012194955, + "step": 92500 + }, + { + "epoch": 36.43, + "learning_rate": 4.121989735491512e-05, + "loss": 2.2931, + "step": 93000 + }, + { + "epoch": 36.43, + "eval_bleu_bleu": 0.07589528134830813, + "eval_bleu_brevity_penalty": 0.9338861808374684, + "eval_bleu_length_ratio": 0.9359784118617251, + "eval_bleu_precisions": [ + 0.3625842958605352, + 0.12576944939731524, + 0.049530139447615716, + 0.019312104582474048 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223024, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.444126018974824, + "eval_chrf_word_order": 2, + "eval_loss": 2.323686361312866, + "eval_meteor": 0.26691631987833814, + "eval_runtime": 908.1157, + "eval_samples_per_second": 18.938, + "eval_scarebleu_bp": 0.9682112757142252, + "eval_scarebleu_counts": [ + 94301, + 31785, + 12114, + 4640 + ], + "eval_scarebleu_precisions": [ + 38.83224483408966, + 14.08616112777923, + 5.810712932361843, + 2.424115772425683 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.07114518178547, + "eval_scarebleu_sys_len": 242842, + "eval_scarebleu_totals": [ + 242842, + 225647, + 208477, + 191410 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 163917, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.06422614931607, + "step": 93000 + }, + { + "epoch": 36.62, + "learning_rate": 4.117054875641532e-05, + "loss": 2.2968, + "step": 93500 + }, + { + "epoch": 36.62, + "eval_bleu_bleu": 0.07661100633758544, + "eval_bleu_brevity_penalty": 0.9402023773065159, + "eval_bleu_length_ratio": 0.9419210253526329, + "eval_bleu_precisions": [ + 0.3622259846729638, + 0.12552293179570073, + 0.04957151650016571, + 0.019558899154662645 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224440, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.55864375072351, + "eval_chrf_word_order": 2, + "eval_loss": 2.317932367324829, + "eval_meteor": 0.2682298784027859, + "eval_runtime": 886.7494, + "eval_samples_per_second": 19.394, + "eval_scarebleu_bp": 0.9688120078612469, + "eval_scarebleu_counts": [ + 94374, + 31757, + 12136, + 4675 + ], + "eval_scarebleu_precisions": [ + 38.838955010123954, + 14.064652137134456, + 5.817191776553879, + 2.440616027146959 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.091632155333356, + "eval_scarebleu_sys_len": 242988, + "eval_scarebleu_totals": [ + 242988, + 225793, + 208623, + 191550 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 163793, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.00744153245195, + "step": 93500 + }, + { + "epoch": 36.82, + "learning_rate": 4.112120015791552e-05, + "loss": 2.2879, + "step": 94000 + }, + { + "epoch": 36.82, + "eval_bleu_bleu": 0.07703770935912604, + "eval_bleu_brevity_penalty": 0.9430182974300813, + "eval_bleu_length_ratio": 0.9445817717885336, + "eval_bleu_precisions": [ + 0.3620009419124377, + 0.12532771468017453, + 0.04972656680106752, + 0.01974184188103079 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225074, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.64734105233926, + "eval_chrf_word_order": 2, + "eval_loss": 2.3176047801971436, + "eval_meteor": 0.267958556875353, + "eval_runtime": 884.8265, + "eval_samples_per_second": 19.437, + "eval_scarebleu_bp": 0.9720933928121399, + "eval_scarebleu_counts": [ + 94649, + 31863, + 12198, + 4757 + ], + "eval_scarebleu_precisions": [ + 38.824465619577744, + 14.061838017229205, + 5.8246029547994, + 2.4731473490480695 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.154275222515736, + "eval_scarebleu_sys_len": 243787, + "eval_scarebleu_totals": [ + 243787, + 226592, + 209422, + 192346 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 163804, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 75.01247887749635, + "step": 94000 + }, + { + "epoch": 37.02, + "learning_rate": 4.1071851559415715e-05, + "loss": 2.2793, + "step": 94500 + }, + { + "epoch": 37.02, + "eval_bleu_bleu": 0.0773086326215184, + "eval_bleu_brevity_penalty": 0.9425835166791262, + "eval_bleu_length_ratio": 0.9441704892164228, + "eval_bleu_precisions": [ + 0.3622030794395847, + 0.12595954394290143, + 0.050052197816609925, + 0.019816467253863924 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224976, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.669618057635773, + "eval_chrf_word_order": 2, + "eval_loss": 2.3161532878875732, + "eval_meteor": 0.2684858427754471, + "eval_runtime": 868.344, + "eval_samples_per_second": 19.806, + "eval_scarebleu_bp": 0.9741005932772707, + "eval_scarebleu_counts": [ + 94799, + 32015, + 12269, + 4770 + ], + "eval_scarebleu_precisions": [ + 38.807992565816676, + 14.09843140363393, + 5.844913748338565, + 2.4735788589385908 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.18655687542055, + "eval_scarebleu_sys_len": 244277, + "eval_scarebleu_totals": [ + 244277, + 227082, + 209909, + 192838 + ], + "eval_steps_per_second": 0.62, + "eval_ter_num_edits": 163772, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.99782478282174, + "step": 94500 + }, + { + "epoch": 37.21, + "learning_rate": 4.102260165811291e-05, + "loss": 2.2622, + "step": 95000 + }, + { + "epoch": 37.21, + "eval_bleu_bleu": 0.07675568399499894, + "eval_bleu_brevity_penalty": 0.9384085628247145, + "eval_bleu_length_ratio": 0.9402297306938505, + "eval_bleu_precisions": [ + 0.36326142556809815, + 0.12633314317208305, + 0.04998312983699205, + 0.01951256240660728 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224037, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.635722125106405, + "eval_chrf_word_order": 2, + "eval_loss": 2.3132102489471436, + "eval_meteor": 0.2679480709181488, + "eval_runtime": 878.4365, + "eval_samples_per_second": 19.578, + "eval_scarebleu_bp": 0.9690834570182909, + "eval_scarebleu_counts": [ + 94606, + 31943, + 12191, + 4691 + ], + "eval_scarebleu_precisions": [ + 38.92386054127889, + 14.14289446070336, + 5.841735030284444, + 2.4481637467186466 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.12841363910043, + "eval_scarebleu_sys_len": 243054, + "eval_scarebleu_totals": [ + 243054, + 225859, + 208688, + 191613 + ], + "eval_steps_per_second": 0.612, + "eval_ter_num_edits": 163606, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.9218066666972, + "step": 95000 + }, + { + "epoch": 37.41, + "learning_rate": 4.097325305961311e-05, + "loss": 2.2697, + "step": 95500 + }, + { + "epoch": 37.41, + "eval_bleu_bleu": 0.07811483134118752, + "eval_bleu_brevity_penalty": 0.9436790002842486, + "eval_bleu_length_ratio": 0.9452070891685797, + "eval_bleu_precisions": [ + 0.36331546955683924, + 0.12670409752533313, + 0.05052759527626712, + 0.020185227795674183 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225223, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.76041090187295, + "eval_chrf_word_order": 2, + "eval_loss": 2.3119752407073975, + "eval_meteor": 0.26990671738236993, + "eval_runtime": 883.2672, + "eval_samples_per_second": 19.471, + "eval_scarebleu_bp": 0.9736626207530998, + "eval_scarebleu_counts": [ + 94964, + 32205, + 12407, + 4853 + ], + "eval_scarebleu_precisions": [ + 38.892574845394606, + 14.188787311377904, + 5.913727359389895, + 2.5180696010418884 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.270299139623567, + "eval_scarebleu_sys_len": 244170, + "eval_scarebleu_totals": [ + 244170, + 226975, + 209800, + 192727 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 163504, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.87509673992187, + "step": 95500 + }, + { + "epoch": 37.6, + "learning_rate": 4.0923904461113306e-05, + "loss": 2.2607, + "step": 96000 + }, + { + "epoch": 37.6, + "eval_bleu_bleu": 0.07726800150507071, + "eval_bleu_brevity_penalty": 0.9410603800822139, + "eval_bleu_length_ratio": 0.9427310002140348, + "eval_bleu_precisions": [ + 0.3638334527874355, + 0.12639439254138585, + 0.049920906448883494, + 0.019797751252510792 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224633, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.76805497242343, + "eval_chrf_word_order": 2, + "eval_loss": 2.3069493770599365, + "eval_meteor": 0.26956051877423587, + "eval_runtime": 878.7389, + "eval_samples_per_second": 19.571, + "eval_scarebleu_bp": 0.9732121738481007, + "eval_scarebleu_counts": [ + 95087, + 32094, + 12273, + 4781 + ], + "eval_scarebleu_precisions": [ + 38.96050151602065, + 14.146739250214885, + 5.85281410054651, + 2.4821277457337616 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.20608476935374, + "eval_scarebleu_sys_len": 244060, + "eval_scarebleu_totals": [ + 244060, + 226865, + 209694, + 192617 + ], + "eval_steps_per_second": 0.612, + "eval_ter_num_edits": 163479, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.86364822845734, + "step": 96000 + }, + { + "epoch": 37.8, + "learning_rate": 4.087455586261351e-05, + "loss": 2.2676, + "step": 96500 + }, + { + "epoch": 37.8, + "eval_bleu_bleu": 0.07859318206425986, + "eval_bleu_brevity_penalty": 0.941859966157248, + "eval_bleu_length_ratio": 0.943486417183218, + "eval_bleu_precisions": [ + 0.36602865492653897, + 0.12815844483618954, + 0.050923811173941125, + 0.020296022094987688 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224813, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.867432281405886, + "eval_chrf_word_order": 2, + "eval_loss": 2.302855968475342, + "eval_meteor": 0.2717965919805728, + "eval_runtime": 900.6665, + "eval_samples_per_second": 19.095, + "eval_scarebleu_bp": 0.973777248432218, + "eval_scarebleu_counts": [ + 95681, + 32553, + 12530, + 4898 + ], + "eval_scarebleu_precisions": [ + 39.18172958009484, + 14.340339114461042, + 5.971443821724046, + 2.541009971051785 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.357111605827647, + "eval_scarebleu_sys_len": 244198, + "eval_scarebleu_totals": [ + 244198, + 227003, + 209832, + 192758 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 163122, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.70016348474371, + "step": 96500 + }, + { + "epoch": 37.99, + "learning_rate": 4.08253059613107e-05, + "loss": 2.2862, + "step": 97000 + }, + { + "epoch": 37.99, + "eval_bleu_bleu": 0.07829144457051927, + "eval_bleu_brevity_penalty": 0.9365760242949657, + "eval_bleu_length_ratio": 0.9385048619475489, + "eval_bleu_precisions": [ + 0.3656283258655076, + 0.12814451317873768, + 0.0511285584462244, + 0.02038363735587474 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223626, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.83363765758708, + "eval_chrf_word_order": 2, + "eval_loss": 2.2980098724365234, + "eval_meteor": 0.27044078858742326, + "eval_runtime": 892.0434, + "eval_samples_per_second": 19.279, + "eval_scarebleu_bp": 0.9667656188882967, + "eval_scarebleu_counts": [ + 94980, + 32304, + 12440, + 4839 + ], + "eval_scarebleu_precisions": [ + 39.16846398423034, + 14.338470279099496, + 5.97729205606354, + 2.5328845781404574 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.283484283624713, + "eval_scarebleu_sys_len": 242491, + "eval_scarebleu_totals": [ + 242491, + 225296, + 208121, + 191047 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 163225, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.74733135197762, + "step": 97000 + }, + { + "epoch": 38.19, + "learning_rate": 4.07760560600079e-05, + "loss": 2.2376, + "step": 97500 + }, + { + "epoch": 38.19, + "eval_bleu_bleu": 0.07806705693434796, + "eval_bleu_brevity_penalty": 0.9360359178230517, + "eval_bleu_length_ratio": 0.9379970538738202, + "eval_bleu_precisions": [ + 0.3654325406590457, + 0.12796277446561, + 0.050986259509698706, + 0.020293509330482674 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223505, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.90055896366798, + "eval_chrf_word_order": 2, + "eval_loss": 2.3027570247650146, + "eval_meteor": 0.2700245302305965, + "eval_runtime": 901.284, + "eval_samples_per_second": 19.082, + "eval_scarebleu_bp": 0.9689477413641532, + "eval_scarebleu_counts": [ + 95097, + 32336, + 12471, + 4833 + ], + "eval_scarebleu_precisions": [ + 39.13118619378572, + 14.318988956098943, + 5.976909030783166, + 2.5226532487055287 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.289508738984617, + "eval_scarebleu_sys_len": 243021, + "eval_scarebleu_totals": [ + 243021, + 225826, + 208653, + 191584 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 163182, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.72763991225861, + "step": 97500 + }, + { + "epoch": 38.39, + "learning_rate": 4.0726707461508093e-05, + "loss": 2.254, + "step": 98000 + }, + { + "epoch": 38.39, + "eval_bleu_bleu": 0.0786481776222588, + "eval_bleu_brevity_penalty": 0.9362368157616587, + "eval_bleu_length_ratio": 0.938185908116116, + "eval_bleu_precisions": [ + 0.36610154327890854, + 0.12856000581522134, + 0.05142842041280161, + 0.020573167756699928 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223550, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.967953813668895, + "eval_chrf_word_order": 2, + "eval_loss": 2.2961905002593994, + "eval_meteor": 0.2707088263713494, + "eval_runtime": 919.6407, + "eval_samples_per_second": 18.701, + "eval_scarebleu_bp": 0.9717489075003207, + "eval_scarebleu_counts": [ + 95421, + 32541, + 12564, + 4925 + ], + "eval_scarebleu_precisions": [ + 39.154626738283895, + 14.36637999540855, + 6.001891713720657, + 2.561661933443602 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.371069590977255, + "eval_scarebleu_sys_len": 243703, + "eval_scarebleu_totals": [ + 243703, + 226508, + 209334, + 192258 + ], + "eval_steps_per_second": 0.585, + "eval_ter_num_edits": 163010, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.64887415338256, + "step": 98000 + }, + { + "epoch": 38.58, + "learning_rate": 4.067735886300829e-05, + "loss": 2.2443, + "step": 98500 + }, + { + "epoch": 38.58, + "eval_bleu_bleu": 0.07889351611138126, + "eval_bleu_brevity_penalty": 0.9365180094198068, + "eval_bleu_length_ratio": 0.9384503040553301, + "eval_bleu_precisions": [ + 0.36635168796089673, + 0.1289325543315021, + 0.051543123444591804, + 0.020685651252576272 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223613, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.922021248251244, + "eval_chrf_word_order": 2, + "eval_loss": 2.294145345687866, + "eval_meteor": 0.2716128653311969, + "eval_runtime": 923.2399, + "eval_samples_per_second": 18.628, + "eval_scarebleu_bp": 0.9670540879467275, + "eval_scarebleu_counts": [ + 95200, + 32527, + 12593, + 4940 + ], + "eval_scarebleu_precisions": [ + 39.24785930137161, + 14.432966818419814, + 6.048656307788371, + 2.5846553095307856 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.381214093600267, + "eval_scarebleu_sys_len": 242561, + "eval_scarebleu_totals": [ + 242561, + 225366, + 208195, + 191128 + ], + "eval_steps_per_second": 0.583, + "eval_ter_num_edits": 162892, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.59483717926994, + "step": 98500 + }, + { + "epoch": 38.78, + "learning_rate": 4.062801026450849e-05, + "loss": 2.2542, + "step": 99000 + }, + { + "epoch": 38.78, + "eval_bleu_bleu": 0.07972522628696058, + "eval_bleu_brevity_penalty": 0.947568334120788, + "eval_bleu_length_ratio": 0.9488960420347575, + "eval_bleu_precisions": [ + 0.3643886387559597, + 0.12851173009999664, + 0.05154789719626168, + 0.02075976029259414 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226102, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.07017722781491, + "eval_chrf_word_order": 2, + "eval_loss": 2.290343999862671, + "eval_meteor": 0.27256620197194575, + "eval_runtime": 899.3864, + "eval_samples_per_second": 19.122, + "eval_scarebleu_bp": 0.9773284471395728, + "eval_scarebleu_counts": [ + 95635, + 32718, + 12704, + 5021 + ], + "eval_scarebleu_precisions": [ + 39.02402200214635, + 14.358060665636849, + 6.029511573491791, + 2.5932372339491474 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.455371314758333, + "eval_scarebleu_sys_len": 245067, + "eval_scarebleu_totals": [ + 245067, + 227872, + 210697, + 193619 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 163002, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.64521062971392, + "step": 99000 + }, + { + "epoch": 38.97, + "learning_rate": 4.057866166600869e-05, + "loss": 2.2508, + "step": 99500 + }, + { + "epoch": 38.97, + "eval_bleu_bleu": 0.07930765541861483, + "eval_bleu_brevity_penalty": 0.9408648341570414, + "eval_bleu_length_ratio": 0.9425463427326789, + "eval_bleu_precisions": [ + 0.36611766382146943, + 0.12873564326836842, + 0.05159353858607947, + 0.020760446615169674 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224589, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 29.970942112050498, + "eval_chrf_word_order": 2, + "eval_loss": 2.2870285511016846, + "eval_meteor": 0.2720466389884024, + "eval_runtime": 921.1729, + "eval_samples_per_second": 18.67, + "eval_scarebleu_bp": 0.9725115413763264, + "eval_scarebleu_counts": [ + 95657, + 32650, + 12666, + 4970 + ], + "eval_scarebleu_precisions": [ + 39.22153110636396, + 14.40267497154755, + 6.045102016465815, + 2.582448701760949 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.424222355703654, + "eval_scarebleu_sys_len": 243889, + "eval_scarebleu_totals": [ + 243889, + 226694, + 209525, + 192453 + ], + "eval_steps_per_second": 0.584, + "eval_ter_num_edits": 162968, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.62964065412216, + "step": 99500 + }, + { + "epoch": 39.17, + "learning_rate": 4.0529313067508886e-05, + "loss": 2.2233, + "step": 100000 + }, + { + "epoch": 39.17, + "eval_bleu_bleu": 0.08018700419805709, + "eval_bleu_brevity_penalty": 0.9420597686564607, + "eval_bleu_length_ratio": 0.9436752714255138, + "eval_bleu_precisions": [ + 0.36730292006510773, + 0.12970052440733304, + 0.05218263133582497, + 0.02111592139320117 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224858, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.159129977422, + "eval_chrf_word_order": 2, + "eval_loss": 2.2875216007232666, + "eval_meteor": 0.27367568754490273, + "eval_runtime": 901.1796, + "eval_samples_per_second": 19.084, + "eval_scarebleu_bp": 0.9738754905460817, + "eval_scarebleu_counts": [ + 95888, + 32877, + 12776, + 5056 + ], + "eval_scarebleu_precisions": [ + 39.26263809157242, + 14.481537438278266, + 6.087984141506557, + 2.6226787011100736 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.50619291880752, + "eval_scarebleu_sys_len": 244222, + "eval_scarebleu_totals": [ + 244222, + 227027, + 209856, + 192780 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 162567, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.44600653023093, + "step": 100000 + }, + { + "epoch": 39.37, + "learning_rate": 4.047996446900908e-05, + "loss": 2.2308, + "step": 100500 + }, + { + "epoch": 39.37, + "eval_bleu_bleu": 0.0797771119491541, + "eval_bleu_brevity_penalty": 0.9417533894498044, + "eval_bleu_length_ratio": 0.9433856949206603, + "eval_bleu_precisions": [ + 0.36542713389000353, + 0.12922820505409596, + 0.051848623443727385, + 0.021031446250728055 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224789, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.097205382777737, + "eval_chrf_word_order": 2, + "eval_loss": 2.285306453704834, + "eval_meteor": 0.2723363572969756, + "eval_runtime": 901.0927, + "eval_samples_per_second": 19.086, + "eval_scarebleu_bp": 0.9697124509912441, + "eval_scarebleu_counts": [ + 95169, + 32648, + 12640, + 4993 + ], + "eval_scarebleu_precisions": [ + 39.130863832044305, + 14.445250694653382, + 6.052422405454841, + 2.6036940855000363 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.42071571141444, + "eval_scarebleu_sys_len": 243207, + "eval_scarebleu_totals": [ + 243207, + 226012, + 208842, + 191766 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 163001, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.64475268925534, + "step": 100500 + }, + { + "epoch": 39.56, + "learning_rate": 4.043061587050928e-05, + "loss": 2.2297, + "step": 101000 + }, + { + "epoch": 39.56, + "eval_bleu_bleu": 0.08019106882457999, + "eval_bleu_brevity_penalty": 0.9414824588392638, + "eval_bleu_length_ratio": 0.9431296925033259, + "eval_bleu_precisions": [ + 0.3663050443202449, + 0.12986368432972106, + 0.05217624255413029, + 0.02120565330256706 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224728, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.255804363441598, + "eval_chrf_word_order": 2, + "eval_loss": 2.2816460132598877, + "eval_meteor": 0.27332395023486145, + "eval_runtime": 902.6041, + "eval_samples_per_second": 19.054, + "eval_scarebleu_bp": 0.9722573929032882, + "eval_scarebleu_counts": [ + 95703, + 32865, + 12747, + 5056 + ], + "eval_scarebleu_precisions": [ + 39.25037013948414, + 14.501482579688659, + 6.085619757377268, + 2.627995218046676 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.496807622513906, + "eval_scarebleu_sys_len": 243827, + "eval_scarebleu_totals": [ + 243827, + 226632, + 209461, + 192390 + ], + "eval_steps_per_second": 0.596, + "eval_ter_num_edits": 162943, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.61819214265762, + "step": 101000 + }, + { + "epoch": 39.76, + "learning_rate": 4.0381365969206476e-05, + "loss": 2.2322, + "step": 101500 + }, + { + "epoch": 39.76, + "eval_bleu_bleu": 0.08050424427721393, + "eval_bleu_brevity_penalty": 0.9426278902262398, + "eval_bleu_length_ratio": 0.9442124568258218, + "eval_bleu_precisions": [ + 0.3673428568888731, + 0.13019331924866814, + 0.052446873803316356, + 0.02120967741935484 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224986, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.23062608491317, + "eval_chrf_word_order": 2, + "eval_loss": 2.2783522605895996, + "eval_meteor": 0.27468902914210064, + "eval_runtime": 901.5634, + "eval_samples_per_second": 19.076, + "eval_scarebleu_bp": 0.977862716871039, + "eval_scarebleu_counts": [ + 96292, + 33103, + 12888, + 5083 + ], + "eval_scarebleu_precisions": [ + 39.271119666555194, + 14.518668614009465, + 6.1129240343021936, + 2.6234026301121 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.562168541163475, + "eval_scarebleu_sys_len": 245198, + "eval_scarebleu_totals": [ + 245198, + 228003, + 210832, + 193756 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 162554, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.44005330426938, + "step": 101500 + }, + { + "epoch": 39.95, + "learning_rate": 4.033201737070668e-05, + "loss": 2.2322, + "step": 102000 + }, + { + "epoch": 39.95, + "eval_bleu_bleu": 0.07962305278232948, + "eval_bleu_brevity_penalty": 0.9349414772498518, + "eval_bleu_length_ratio": 0.936968847443543, + "eval_bleu_precisions": [ + 0.3672803009943564, + 0.1303326620241186, + 0.05239615260419148, + 0.020973325188352678 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223260, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.25351142912609, + "eval_chrf_word_order": 2, + "eval_loss": 2.274219274520874, + "eval_meteor": 0.27237740645799935, + "eval_runtime": 890.9064, + "eval_samples_per_second": 19.304, + "eval_scarebleu_bp": 0.9687585321862687, + "eval_scarebleu_counts": [ + 95554, + 32882, + 12777, + 5013 + ], + "eval_scarebleu_precisions": [ + 39.326679699557566, + 14.56373460891133, + 6.124826230765543, + 2.617221558011684 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.482855111003733, + "eval_scarebleu_sys_len": 242975, + "eval_scarebleu_totals": [ + 242975, + 225780, + 208610, + 191539 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 162649, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.48355764783463, + "step": 102000 + }, + { + "epoch": 40.15, + "learning_rate": 4.028266877220687e-05, + "loss": 2.2141, + "step": 102500 + }, + { + "epoch": 40.15, + "eval_bleu_bleu": 0.08041719237164284, + "eval_bleu_brevity_penalty": 0.9365804868471331, + "eval_bleu_length_ratio": 0.9385090587084888, + "eval_bleu_precisions": [ + 0.36801012400112687, + 0.13093900170516198, + 0.05283930005494738, + 0.02134663167916773 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 223627, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.22582013268319, + "eval_chrf_word_order": 2, + "eval_loss": 2.2742130756378174, + "eval_meteor": 0.2738874885701491, + "eval_runtime": 897.3887, + "eval_samples_per_second": 19.164, + "eval_scarebleu_bp": 0.9674619282749355, + "eval_scarebleu_counts": [ + 95600, + 32965, + 12835, + 5065 + ], + "eval_scarebleu_precisions": [ + 39.3966867221627, + 14.62089459561351, + 6.162022545272982, + 2.6486706967598885 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.526428392713418, + "eval_scarebleu_sys_len": 242660, + "eval_scarebleu_totals": [ + 242660, + 225465, + 208292, + 191228 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 162549, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.43776360197647, + "step": 102500 + }, + { + "epoch": 40.34, + "learning_rate": 4.0233320173707065e-05, + "loss": 2.2036, + "step": 103000 + }, + { + "epoch": 40.34, + "eval_bleu_bleu": 0.08145470581882554, + "eval_bleu_brevity_penalty": 0.9483321284115765, + "eval_bleu_length_ratio": 0.9496220816773614, + "eval_bleu_precisions": [ + 0.3674555297757154, + 0.13049550411325808, + 0.0526263684158421, + 0.0215684592732367 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226275, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.43713614808498, + "eval_chrf_word_order": 2, + "eval_loss": 2.2722408771514893, + "eval_meteor": 0.27544084777889716, + "eval_runtime": 892.8324, + "eval_samples_per_second": 19.262, + "eval_scarebleu_bp": 0.9805461502997642, + "eval_scarebleu_counts": [ + 96624, + 33375, + 13015, + 5198 + ], + "eval_scarebleu_precisions": [ + 39.30089442236747, + 14.59577892260192, + 6.153984367981313, + 2.6737582815521996 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.664849587329662, + "eval_scarebleu_sys_len": 245857, + "eval_scarebleu_totals": [ + 245857, + 228662, + 211489, + 194408 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 162421, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.37914722327803, + "step": 103000 + }, + { + "epoch": 40.54, + "learning_rate": 4.0184168969601264e-05, + "loss": 2.22, + "step": 103500 + }, + { + "epoch": 40.54, + "eval_bleu_bleu": 0.0817695012084974, + "eval_bleu_brevity_penalty": 0.9435681728455223, + "eval_bleu_length_ratio": 0.945102170145082, + "eval_bleu_precisions": [ + 0.3688087816055205, + 0.1314452195401028, + 0.05346775376747501, + 0.02175876650461698 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225198, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.487680414926594, + "eval_chrf_word_order": 2, + "eval_loss": 2.269068956375122, + "eval_meteor": 0.275992135472944, + "eval_runtime": 882.4869, + "eval_samples_per_second": 19.488, + "eval_scarebleu_bp": 0.9769897959263333, + "eval_scarebleu_counts": [ + 96587, + 33491, + 13126, + 5213 + ], + "eval_scarebleu_precisions": [ + 39.42584005486073, + 14.702641479614908, + 6.232165494713152, + 2.693500051668906 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.703381353047874, + "eval_scarebleu_sys_len": 244984, + "eval_scarebleu_totals": [ + 244984, + 227789, + 210617, + 193540 + ], + "eval_steps_per_second": 0.61, + "eval_ter_num_edits": 162203, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.27931620330725, + "step": 103500 + }, + { + "epoch": 40.74, + "learning_rate": 4.013482037110146e-05, + "loss": 2.2131, + "step": 104000 + }, + { + "epoch": 40.74, + "eval_bleu_bleu": 0.08123156030621156, + "eval_bleu_brevity_penalty": 0.94494604186325, + "eval_bleu_length_ratio": 0.946407362797393, + "eval_bleu_precisions": [ + 0.36892984315481864, + 0.13142659638814483, + 0.052962255761031626, + 0.021265598888193373 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225509, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.467448704402315, + "eval_chrf_word_order": 2, + "eval_loss": 2.26434063911438, + "eval_meteor": 0.2767917048972901, + "eval_runtime": 883.7802, + "eval_samples_per_second": 19.46, + "eval_scarebleu_bp": 0.9738509308987449, + "eval_scarebleu_counts": [ + 96433, + 33361, + 12979, + 5085 + ], + "eval_scarebleu_precisions": [ + 39.48676581386969, + 14.69511631082587, + 6.1849234449532755, + 2.637749120750293 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.605955834688698, + "eval_scarebleu_sys_len": 244216, + "eval_scarebleu_totals": [ + 244216, + 227021, + 209849, + 192778 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 162249, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.300381464402, + "step": 104000 + }, + { + "epoch": 40.93, + "learning_rate": 4.0085471772601663e-05, + "loss": 2.2078, + "step": 104500 + }, + { + "epoch": 40.93, + "eval_bleu_bleu": 0.08137593193009969, + "eval_bleu_brevity_penalty": 0.9395350574720125, + "eval_bleu_length_ratio": 0.9412915112116469, + "eval_bleu_precisions": [ + 0.36869231798118507, + 0.13188633235954514, + 0.053212661106899165, + 0.02174969061195221 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224290, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.498807128367055, + "eval_chrf_word_order": 2, + "eval_loss": 2.265319585800171, + "eval_meteor": 0.27522273008669085, + "eval_runtime": 904.9784, + "eval_samples_per_second": 19.004, + "eval_scarebleu_bp": 0.9691410279646165, + "eval_scarebleu_counts": [ + 96036, + 33284, + 12968, + 5173 + ], + "eval_scarebleu_precisions": [ + 39.50993137722777, + 14.735714317337619, + 6.213644334984811, + 2.699374337941003 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.634046166545005, + "eval_scarebleu_sys_len": 243068, + "eval_scarebleu_totals": [ + 243068, + 225873, + 208702, + 191637 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 162374, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.3576240217247, + "step": 104500 + }, + { + "epoch": 41.13, + "learning_rate": 4.003612317410186e-05, + "loss": 2.185, + "step": 105000 + }, + { + "epoch": 41.13, + "eval_bleu_bleu": 0.0819537525044089, + "eval_bleu_brevity_penalty": 0.9461186966524793, + "eval_bleu_length_ratio": 0.9475195044464683, + "eval_bleu_precisions": [ + 0.3680007441069388, + 0.13170069853628602, + 0.05339128708526411, + 0.021756333650637092 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225774, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.57289550024335, + "eval_chrf_word_order": 2, + "eval_loss": 2.265334367752075, + "eval_meteor": 0.27627830487306926, + "eval_runtime": 904.3283, + "eval_samples_per_second": 19.017, + "eval_scarebleu_bp": 0.9758547017710176, + "eval_scarebleu_counts": [ + 96476, + 33515, + 13101, + 5232 + ], + "eval_scarebleu_precisions": [ + 39.42526950708197, + 14.73115585620036, + 6.228576047010274, + 2.707205762126026 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.70768201178772, + "eval_scarebleu_sys_len": 244706, + "eval_scarebleu_totals": [ + 244706, + 227511, + 210337, + 193262 + ], + "eval_steps_per_second": 0.595, + "eval_ter_num_edits": 162225, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.28939089339605, + "step": 105000 + }, + { + "epoch": 41.32, + "learning_rate": 3.9986774575602056e-05, + "loss": 2.192, + "step": 105500 + }, + { + "epoch": 41.32, + "eval_bleu_bleu": 0.08164186865974944, + "eval_bleu_brevity_penalty": 0.9395306072687831, + "eval_bleu_length_ratio": 0.9412873144507069, + "eval_bleu_precisions": [ + 0.36983534636116794, + 0.1324857311172704, + 0.053655197830836866, + 0.021687959423273784 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224289, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.538732520453916, + "eval_chrf_word_order": 2, + "eval_loss": 2.2652299404144287, + "eval_meteor": 0.27670567092085413, + "eval_runtime": 885.656, + "eval_samples_per_second": 19.418, + "eval_scarebleu_bp": 0.9705135542755867, + "eval_scarebleu_counts": [ + 96387, + 33517, + 13131, + 5211 + ], + "eval_scarebleu_precisions": [ + 39.59992111815022, + 14.816959687365996, + 6.28169310549379, + 2.714613905949646 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.706466417439938, + "eval_scarebleu_sys_len": 243402, + "eval_scarebleu_totals": [ + 243402, + 226207, + 209036, + 191961 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 162055, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.21154101543718, + "step": 105500 + }, + { + "epoch": 41.52, + "learning_rate": 3.993742597710225e-05, + "loss": 2.1939, + "step": 106000 + }, + { + "epoch": 41.52, + "eval_bleu_bleu": 0.0820386334955823, + "eval_bleu_brevity_penalty": 0.9447866374930116, + "eval_bleu_length_ratio": 0.9462562794035564, + "eval_bleu_precisions": [ + 0.36958305429031413, + 0.1324431769077867, + 0.053506490788365245, + 0.021706539533013585 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225473, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.623776295472233, + "eval_chrf_word_order": 2, + "eval_loss": 2.2545361518859863, + "eval_meteor": 0.2770948173760698, + "eval_runtime": 888.1507, + "eval_samples_per_second": 19.364, + "eval_scarebleu_bp": 0.9749187327522213, + "eval_scarebleu_counts": [ + 96733, + 33668, + 13153, + 5181 + ], + "eval_scarebleu_precisions": [ + 39.56732126130474, + 14.813315616722837, + 6.260084051611306, + 2.683941420556681 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.71189427346959, + "eval_scarebleu_sys_len": 244477, + "eval_scarebleu_totals": [ + 244477, + 227282, + 210109, + 193037 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 162043, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.20604572993419, + "step": 106000 + }, + { + "epoch": 41.72, + "learning_rate": 3.988807737860245e-05, + "loss": 2.1968, + "step": 106500 + }, + { + "epoch": 41.72, + "eval_bleu_bleu": 0.08276218337930524, + "eval_bleu_brevity_penalty": 0.9473739860838443, + "eval_bleu_length_ratio": 0.9487113845534016, + "eval_bleu_precisions": [ + 0.3694096205398614, + 0.13292924069844828, + 0.0540674473800892, + 0.02193700553004889 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226058, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.71766289742337, + "eval_chrf_word_order": 2, + "eval_loss": 2.2563352584838867, + "eval_meteor": 0.27758866058910936, + "eval_runtime": 892.4818, + "eval_samples_per_second": 19.27, + "eval_scarebleu_bp": 0.9759854241709304, + "eval_scarebleu_counts": [ + 96812, + 33801, + 13315, + 5288 + ], + "eval_scarebleu_precisions": [ + 39.55740424453906, + 14.854774701924471, + 6.32923426485338, + 2.7356016202542124 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.802070034886079, + "eval_scarebleu_sys_len": 244738, + "eval_scarebleu_totals": [ + 244738, + 227543, + 210373, + 193303 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 162027, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.19871868259689, + "step": 106500 + }, + { + "epoch": 41.91, + "learning_rate": 3.9838728780102645e-05, + "loss": 2.1935, + "step": 107000 + }, + { + "epoch": 41.91, + "eval_bleu_bleu": 0.08323670346540714, + "eval_bleu_brevity_penalty": 0.9439006203980763, + "eval_bleu_length_ratio": 0.945416927215575, + "eval_bleu_precisions": [ + 0.370213030411989, + 0.13336345024461982, + 0.054541169076052796, + 0.022456467232535138 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225273, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.711571545231507, + "eval_chrf_word_order": 2, + "eval_loss": 2.2553675174713135, + "eval_meteor": 0.27784869163613257, + "eval_runtime": 892.1976, + "eval_samples_per_second": 19.276, + "eval_scarebleu_bp": 0.9741906205518825, + "eval_scarebleu_counts": [ + 96821, + 33838, + 13346, + 5370 + ], + "eval_scarebleu_precisions": [ + 39.63217205146153, + 14.89978159785825, + 6.357266365935798, + 2.784388756669311 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.85033403592959, + "eval_scarebleu_sys_len": 244299, + "eval_scarebleu_totals": [ + 244299, + 227104, + 209933, + 192861 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 162023, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.19688692076257, + "step": 107000 + }, + { + "epoch": 42.11, + "learning_rate": 3.978947887879985e-05, + "loss": 2.1812, + "step": 107500 + }, + { + "epoch": 42.11, + "eval_bleu_bleu": 0.08271867700515136, + "eval_bleu_brevity_penalty": 0.9454373875747651, + "eval_bleu_length_ratio": 0.9468732032617226, + "eval_bleu_precisions": [ + 0.3699184469461927, + 0.13284394866258847, + 0.05395104200432905, + 0.022102206203080878 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225620, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.721263260811998, + "eval_chrf_word_order": 2, + "eval_loss": 2.2525553703308105, + "eval_meteor": 0.2778050723988427, + "eval_runtime": 892.2641, + "eval_samples_per_second": 19.275, + "eval_scarebleu_bp": 0.9733145654887002, + "eval_scarebleu_counts": [ + 96672, + 33716, + 13228, + 5254 + ], + "eval_scarebleu_precisions": [ + 39.60587500256058, + 14.860064348362643, + 6.307517714263916, + 2.727338794240093 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.763323744482513, + "eval_scarebleu_sys_len": 244085, + "eval_scarebleu_totals": [ + 244085, + 226890, + 209718, + 192642 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 161945, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.1611675649932, + "step": 107500 + }, + { + "epoch": 42.3, + "learning_rate": 3.974013028030004e-05, + "loss": 2.1686, + "step": 108000 + }, + { + "epoch": 42.3, + "eval_bleu_bleu": 0.08378795607428229, + "eval_bleu_brevity_penalty": 0.9524110251976367, + "eval_bleu_length_ratio": 0.9535082823077149, + "eval_bleu_precisions": [ + 0.36931175478981165, + 0.13326285915640507, + 0.05451990438015629, + 0.022323967694232737 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227201, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.967777293865307, + "eval_chrf_word_order": 2, + "eval_loss": 2.251058578491211, + "eval_meteor": 0.2795046094731588, + "eval_runtime": 899.7122, + "eval_samples_per_second": 19.115, + "eval_scarebleu_bp": 0.9820984205362882, + "eval_scarebleu_counts": [ + 97268, + 34084, + 13491, + 5411 + ], + "eval_scarebleu_precisions": [ + 39.50145996369381, + 14.88098356647631, + 6.36752378794744, + 2.777749258205936 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.917041092373575, + "eval_scarebleu_sys_len": 246239, + "eval_scarebleu_totals": [ + 246239, + 229044, + 211872, + 194798 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 161880, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.1314014351854, + "step": 108000 + }, + { + "epoch": 42.5, + "learning_rate": 3.9690781681800236e-05, + "loss": 2.1781, + "step": 108500 + }, + { + "epoch": 42.5, + "eval_bleu_bleu": 0.08301625625387049, + "eval_bleu_brevity_penalty": 0.9436568357235952, + "eval_bleu_length_ratio": 0.9451861053638801, + "eval_bleu_precisions": [ + 0.3709472599881004, + 0.1338938482763925, + 0.0543793191975396, + 0.022176329141594855 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225218, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.792013010018437, + "eval_chrf_word_order": 2, + "eval_loss": 2.244746208190918, + "eval_meteor": 0.2787500907442323, + "eval_runtime": 881.0959, + "eval_samples_per_second": 19.519, + "eval_scarebleu_bp": 0.9741906205518825, + "eval_scarebleu_counts": [ + 96986, + 33968, + 13334, + 5285 + ], + "eval_scarebleu_precisions": [ + 39.69971223787244, + 14.957024094687897, + 6.351641023198209, + 2.7403581910006327 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.82257608270538, + "eval_scarebleu_sys_len": 244299, + "eval_scarebleu_totals": [ + 244299, + 227104, + 209930, + 192858 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 161640, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.02149572512582, + "step": 108500 + }, + { + "epoch": 42.69, + "learning_rate": 3.964143308330044e-05, + "loss": 2.1821, + "step": 109000 + }, + { + "epoch": 42.69, + "eval_bleu_bleu": 0.08286178501673322, + "eval_bleu_brevity_penalty": 0.9405714478084503, + "eval_bleu_length_ratio": 0.942269356510645, + "eval_bleu_precisions": [ + 0.3708528747611603, + 0.13379765395894427, + 0.05459325866330126, + 0.02223621210458528 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224523, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.74308895221285, + "eval_chrf_word_order": 2, + "eval_loss": 2.246273994445801, + "eval_meteor": 0.2777618402593727, + "eval_runtime": 894.0905, + "eval_samples_per_second": 19.235, + "eval_scarebleu_bp": 0.9714043068341303, + "eval_scarebleu_counts": [ + 96702, + 33829, + 13354, + 5336 + ], + "eval_scarebleu_precisions": [ + 39.69394833736285, + 14.940554004875809, + 6.381748409819692, + 2.776578086055188 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.83524465744469, + "eval_scarebleu_sys_len": 243619, + "eval_scarebleu_totals": [ + 243619, + 226424, + 209253, + 192179 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 161817, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.10255118629476, + "step": 109000 + }, + { + "epoch": 42.89, + "learning_rate": 3.9592183181997636e-05, + "loss": 2.1834, + "step": 109500 + }, + { + "epoch": 42.89, + "eval_bleu_bleu": 0.08376967673164924, + "eval_bleu_brevity_penalty": 0.9445341981402636, + "eval_bleu_length_ratio": 0.9460170640299816, + "eval_bleu_precisions": [ + 0.3709630194839763, + 0.13416994443403885, + 0.05504524732938695, + 0.02258244315602572 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225416, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.874886756592602, + "eval_chrf_word_order": 2, + "eval_loss": 2.243274211883545, + "eval_meteor": 0.2792540260767041, + "eval_runtime": 888.2997, + "eval_samples_per_second": 19.361, + "eval_scarebleu_bp": 0.9748573949152397, + "eval_scarebleu_counts": [ + 97054, + 34018, + 13456, + 5387 + ], + "eval_scarebleu_precisions": [ + 39.70105783311926, + 14.968297201089467, + 6.404752158557598, + 2.7909024971505545 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.896837916858805, + "eval_scarebleu_sys_len": 244462, + "eval_scarebleu_totals": [ + 244462, + 227267, + 210094, + 193020 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 161633, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 74.01829014191574, + "step": 109500 + }, + { + "epoch": 43.09, + "learning_rate": 3.9542834583497826e-05, + "loss": 2.1618, + "step": 110000 + }, + { + "epoch": 43.09, + "eval_bleu_bleu": 0.08398075656784036, + "eval_bleu_brevity_penalty": 0.9444278898778491, + "eval_bleu_length_ratio": 0.9459163417674239, + "eval_bleu_precisions": [ + 0.371943103570668, + 0.1345840718165968, + 0.055204254695450074, + 0.022625656586554486 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225392, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.911072516206584, + "eval_chrf_word_order": 2, + "eval_loss": 2.2393362522125244, + "eval_meteor": 0.28074976894792786, + "eval_runtime": 890.6467, + "eval_samples_per_second": 19.31, + "eval_scarebleu_bp": 0.975907809757291, + "eval_scarebleu_counts": [ + 97374, + 34178, + 13504, + 5421 + ], + "eval_scarebleu_precisions": [ + 39.790126635038554, + 15.021711995218087, + 6.41974604351774, + 2.8048117966627863 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.940034116957532, + "eval_scarebleu_sys_len": 244719, + "eval_scarebleu_totals": [ + 244719, + 227524, + 210351, + 193275 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 161449, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.93402909753674, + "step": 110000 + }, + { + "epoch": 43.28, + "learning_rate": 3.949348598499803e-05, + "loss": 2.1489, + "step": 110500 + }, + { + "epoch": 43.28, + "eval_bleu_bleu": 0.08368726198087074, + "eval_bleu_brevity_penalty": 0.9466227596539202, + "eval_bleu_length_ratio": 0.9479979351936175, + "eval_bleu_precisions": [ + 0.37167977050573736, + 0.1343312904601496, + 0.05468480791922061, + 0.02237262104653895 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225888, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 30.96599563815333, + "eval_chrf_word_order": 2, + "eval_loss": 2.2402048110961914, + "eval_meteor": 0.2804123485073307, + "eval_runtime": 882.5914, + "eval_samples_per_second": 19.486, + "eval_scarebleu_bp": 0.9774304285582827, + "eval_scarebleu_counts": [ + 97437, + 34203, + 13445, + 5361 + ], + "eval_scarebleu_precisions": [ + 39.75527556999005, + 15.008095762559401, + 6.380353541345356, + 2.7684251838387177 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.903422992429224, + "eval_scarebleu_sys_len": 245092, + "eval_scarebleu_totals": [ + 245092, + 227897, + 210725, + 193648 + ], + "eval_steps_per_second": 0.61, + "eval_ter_num_edits": 161549, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.9798231433949, + "step": 110500 + }, + { + "epoch": 43.48, + "learning_rate": 3.944423608369523e-05, + "loss": 2.1629, + "step": 111000 + }, + { + "epoch": 43.48, + "eval_bleu_bleu": 0.08463814276133515, + "eval_bleu_brevity_penalty": 0.9501048227128521, + "eval_bleu_length_ratio": 0.9513091795752039, + "eval_bleu_precisions": [ + 0.37125072239353796, + 0.13487555016660144, + 0.055184642103183267, + 0.02279080381082777 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226677, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.113073636659234, + "eval_chrf_word_order": 2, + "eval_loss": 2.2400150299072266, + "eval_meteor": 0.2814228778365361, + "eval_runtime": 897.8651, + "eval_samples_per_second": 19.154, + "eval_scarebleu_bp": 0.9781521663246732, + "eval_scarebleu_counts": [ + 97484, + 34331, + 13571, + 5453 + ], + "eval_scarebleu_precisions": [ + 39.74574854547456, + 15.052570656892062, + 6.434772713263569, + 2.813333539702931 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.978617341617054, + "eval_scarebleu_sys_len": 245269, + "eval_scarebleu_totals": [ + 245269, + 228074, + 210901, + 193827 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 161499, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.95692612046581, + "step": 111000 + }, + { + "epoch": 43.67, + "learning_rate": 3.939488748519542e-05, + "loss": 2.155, + "step": 111500 + }, + { + "epoch": 43.67, + "eval_bleu_bleu": 0.08404341929801172, + "eval_bleu_brevity_penalty": 0.9443260011110467, + "eval_bleu_length_ratio": 0.945819816265806, + "eval_bleu_precisions": [ + 0.37292174167698305, + 0.13495441313516576, + 0.055230397135348504, + 0.022570651830309162 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225369, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.000618852238134, + "eval_chrf_word_order": 2, + "eval_loss": 2.233893632888794, + "eval_meteor": 0.2807980961795671, + "eval_runtime": 914.817, + "eval_samples_per_second": 18.799, + "eval_scarebleu_bp": 0.973494749995395, + "eval_scarebleu_counts": [ + 97416, + 34172, + 13537, + 5430 + ], + "eval_scarebleu_precisions": [ + 39.90349364475339, + 15.058122625961733, + 6.453442916801739, + 2.8179539474708473 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.953146406235733, + "eval_scarebleu_sys_len": 244129, + "eval_scarebleu_totals": [ + 244129, + 226934, + 209764, + 192693 + ], + "eval_steps_per_second": 0.588, + "eval_ter_num_edits": 161285, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.85892686232935, + "step": 111500 + }, + { + "epoch": 43.87, + "learning_rate": 3.934553888669562e-05, + "loss": 2.164, + "step": 112000 + }, + { + "epoch": 43.87, + "eval_bleu_bleu": 0.08414308820647008, + "eval_bleu_brevity_penalty": 0.9484512834233482, + "eval_bleu_length_ratio": 0.9497353942227389, + "eval_bleu_precisions": [ + 0.37157426801353943, + 0.13439052733767878, + 0.055071920145455304, + 0.022525226538604465 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226302, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.017974282217075, + "eval_chrf_word_order": 2, + "eval_loss": 2.2290892601013184, + "eval_meteor": 0.28068148935882187, + "eval_runtime": 897.155, + "eval_samples_per_second": 19.169, + "eval_scarebleu_bp": 0.9805542835280067, + "eval_scarebleu_counts": [ + 97710, + 34303, + 13565, + 5411 + ], + "eval_scarebleu_precisions": [ + 39.74229131331373, + 15.001486897806389, + 6.41389353835097, + 2.7832214592495435 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.959460681172338, + "eval_scarebleu_sys_len": 245859, + "eval_scarebleu_totals": [ + 245859, + 228664, + 211494, + 194415 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 161476, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.94639348991844, + "step": 112000 + }, + { + "epoch": 44.07, + "learning_rate": 3.9296190288195816e-05, + "loss": 2.1514, + "step": 112500 + }, + { + "epoch": 44.07, + "eval_bleu_bleu": 0.08464313720540276, + "eval_bleu_brevity_penalty": 0.9468570228726237, + "eval_bleu_length_ratio": 0.9482203635234326, + "eval_bleu_precisions": [ + 0.3713447315892202, + 0.13500617975913312, + 0.055682856173500016, + 0.022875835715636117 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225941, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.12594167993675, + "eval_chrf_word_order": 2, + "eval_loss": 2.2338244915008545, + "eval_meteor": 0.2806436775275996, + "eval_runtime": 900.3613, + "eval_samples_per_second": 19.101, + "eval_scarebleu_bp": 0.975907809757291, + "eval_scarebleu_counts": [ + 97297, + 34284, + 13632, + 5458 + ], + "eval_scarebleu_precisions": [ + 39.75866197557198, + 15.068300486981594, + 6.480565908572298, + 2.8239701149663174 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.986218371908116, + "eval_scarebleu_sys_len": 244719, + "eval_scarebleu_totals": [ + 244719, + 227524, + 210352, + 193274 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 161485, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.95051495404567, + "step": 112500 + }, + { + "epoch": 44.26, + "learning_rate": 3.924684168969601e-05, + "loss": 2.1329, + "step": 113000 + }, + { + "epoch": 44.26, + "eval_bleu_bleu": 0.08496539154951828, + "eval_bleu_brevity_penalty": 0.9474932493483653, + "eval_bleu_length_ratio": 0.9488246970987791, + "eval_bleu_precisions": [ + 0.37284649578698276, + 0.13541576906505817, + 0.05572970181871287, + 0.022981466005746798 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226085, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.048458456203537, + "eval_chrf_word_order": 2, + "eval_loss": 2.2276077270507812, + "eval_meteor": 0.2816138123742026, + "eval_runtime": 890.4604, + "eval_samples_per_second": 19.314, + "eval_scarebleu_bp": 0.9721958959332213, + "eval_scarebleu_counts": [ + 97360, + 34248, + 13568, + 5446 + ], + "eval_scarebleu_precisions": [ + 39.93240693649205, + 15.112723229060485, + 6.478134862468548, + 2.8310763392509033 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 9.97174648904625, + "eval_scarebleu_sys_len": 243812, + "eval_scarebleu_totals": [ + 243812, + 226617, + 209443, + 192365 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 161126, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.78611432941489, + "step": 113000 + }, + { + "epoch": 44.46, + "learning_rate": 3.9197493091196215e-05, + "loss": 2.1429, + "step": 113500 + }, + { + "epoch": 44.46, + "eval_bleu_bleu": 0.08493542457765622, + "eval_bleu_brevity_penalty": 0.948883658877927, + "eval_bleu_length_ratio": 0.9501466767948498, + "eval_bleu_precisions": [ + 0.3714001766784452, + 0.13526923352692335, + 0.055836453294314296, + 0.02288466812945694 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226400, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.286450035359465, + "eval_chrf_word_order": 2, + "eval_loss": 2.2315003871917725, + "eval_meteor": 0.28152092562502634, + "eval_runtime": 887.2773, + "eval_samples_per_second": 19.383, + "eval_scarebleu_bp": 0.9802207679773393, + "eval_scarebleu_counts": [ + 97623, + 34522, + 13747, + 5541 + ], + "eval_scarebleu_precisions": [ + 39.720152821460104, + 15.10267650121182, + 6.50253062769027, + 2.851364702976411 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.066393455913706, + "eval_scarebleu_sys_len": 245777, + "eval_scarebleu_totals": [ + 245777, + 228582, + 211410, + 194328 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 161395, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.90930031277333, + "step": 113500 + }, + { + "epoch": 44.65, + "learning_rate": 3.914814449269641e-05, + "loss": 2.1472, + "step": 114000 + }, + { + "epoch": 44.65, + "eval_bleu_bleu": 0.08531808972500356, + "eval_bleu_brevity_penalty": 0.9495407063539616, + "eval_bleu_length_ratio": 0.9507719941748958, + "eval_bleu_precisions": [ + 0.37286856265090557, + 0.13589900360155527, + 0.05599059278953968, + 0.022973281571134964 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226549, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.252819151864227, + "eval_chrf_word_order": 2, + "eval_loss": 2.2226319313049316, + "eval_meteor": 0.2823922755056947, + "eval_runtime": 888.0265, + "eval_samples_per_second": 19.367, + "eval_scarebleu_bp": 0.9793620740370291, + "eval_scarebleu_counts": [ + 97976, + 34634, + 13744, + 5527 + ], + "eval_scarebleu_precisions": [ + 39.898031486443564, + 15.165673399862504, + 6.5076373829297625, + 2.847251915082141 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.077641007558917, + "eval_scarebleu_sys_len": 245566, + "eval_scarebleu_totals": [ + 245566, + 228371, + 211198, + 194117 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 161102, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.77512375840894, + "step": 114000 + }, + { + "epoch": 44.85, + "learning_rate": 3.909879589419661e-05, + "loss": 2.1497, + "step": 114500 + }, + { + "epoch": 44.85, + "eval_bleu_bleu": 0.08497767509237251, + "eval_bleu_brevity_penalty": 0.9485527752216263, + "eval_bleu_length_ratio": 0.9498319197243568, + "eval_bleu_precisions": [ + 0.37247321329945876, + 0.13594414957203654, + 0.055675655965286064, + 0.022848225361130008 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226325, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.274545655531906, + "eval_chrf_word_order": 2, + "eval_loss": 2.2216646671295166, + "eval_meteor": 0.2820542427658562, + "eval_runtime": 910.7431, + "eval_samples_per_second": 18.883, + "eval_scarebleu_bp": 0.9776629081878023, + "eval_scarebleu_counts": [ + 97734, + 34573, + 13671, + 5456 + ], + "eval_scarebleu_precisions": [ + 39.86718281534903, + 15.166656430683384, + 6.485847937679688, + 2.816683272845542 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.022860413335518, + "eval_scarebleu_sys_len": 245149, + "eval_scarebleu_totals": [ + 245149, + 227954, + 210782, + 193703 + ], + "eval_steps_per_second": 0.591, + "eval_ter_num_edits": 161112, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.77970316299475, + "step": 114500 + }, + { + "epoch": 45.05, + "learning_rate": 3.9049545992893805e-05, + "loss": 2.1364, + "step": 115000 + }, + { + "epoch": 45.05, + "eval_bleu_bleu": 0.08534906214010006, + "eval_bleu_brevity_penalty": 0.9502942627415651, + "eval_bleu_length_ratio": 0.9514896402956199, + "eval_bleu_precisions": [ + 0.3733592095977417, + 0.1360553633217993, + 0.05590933901697294, + 0.02291055927544002 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226720, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.303413555173293, + "eval_chrf_word_order": 2, + "eval_loss": 2.2223477363586426, + "eval_meteor": 0.2834077369922771, + "eval_runtime": 880.6541, + "eval_samples_per_second": 19.529, + "eval_scarebleu_bp": 0.978209231194136, + "eval_scarebleu_counts": [ + 98077, + 34657, + 13770, + 5542 + ], + "eval_scarebleu_precisions": [ + 39.985241537326274, + 15.19457402406089, + 6.52866544027006, + 2.8590442682404653 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.094623915859636, + "eval_scarebleu_sys_len": 245283, + "eval_scarebleu_totals": [ + 245283, + 228088, + 210916, + 193841 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 160812, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.64232102542027, + "step": 115000 + }, + { + "epoch": 45.24, + "learning_rate": 3.9000197394394e-05, + "loss": 2.1179, + "step": 115500 + }, + { + "epoch": 45.24, + "eval_bleu_bleu": 0.08549730768655792, + "eval_bleu_brevity_penalty": 0.9452028095260888, + "eval_bleu_length_ratio": 0.9466507749319075, + "eval_bleu_precisions": [ + 0.3744829695833167, + 0.1368082083965216, + 0.056251993870645514, + 0.023228843724882306 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225567, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.327460359303906, + "eval_chrf_word_order": 2, + "eval_loss": 2.219003200531006, + "eval_meteor": 0.2830799530551107, + "eval_runtime": 881.7346, + "eval_samples_per_second": 19.505, + "eval_scarebleu_bp": 0.9761038769418444, + "eval_scarebleu_counts": [ + 98057, + 34707, + 13745, + 5543 + ], + "eval_scarebleu_precisions": [ + 40.061364481323054, + 15.250997486509764, + 6.532825726358015, + 2.8672518764128054 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.095870332371604, + "eval_scarebleu_sys_len": 244767, + "eval_scarebleu_totals": [ + 244767, + 227572, + 210399, + 193321 + ], + "eval_steps_per_second": 0.61, + "eval_ter_num_edits": 160775, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.62537722845276, + "step": 115500 + }, + { + "epoch": 45.44, + "learning_rate": 3.89508487958942e-05, + "loss": 2.1258, + "step": 116000 + }, + { + "epoch": 45.44, + "eval_bleu_bleu": 0.08614802991945111, + "eval_bleu_brevity_penalty": 0.9481688200453937, + "eval_bleu_length_ratio": 0.9494668015225849, + "eval_bleu_precisions": [ + 0.373089401426816, + 0.13653650205938492, + 0.05664939910986961, + 0.02361466179389073 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226238, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.364486927949102, + "eval_chrf_word_order": 2, + "eval_loss": 2.219782829284668, + "eval_meteor": 0.28316095440746, + "eval_runtime": 894.0393, + "eval_samples_per_second": 19.236, + "eval_scarebleu_bp": 0.9768877705863861, + "eval_scarebleu_counts": [ + 97845, + 34670, + 13839, + 5635 + ], + "eval_scarebleu_precisions": [ + 39.94341910278863, + 15.22189634885232, + 6.571443495272872, + 2.91194906802127 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.145753588418941, + "eval_scarebleu_sys_len": 244959, + "eval_scarebleu_totals": [ + 244959, + 227764, + 210593, + 193513 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 161037, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.74535762860113, + "step": 116000 + }, + { + "epoch": 45.63, + "learning_rate": 3.8901500197394395e-05, + "loss": 2.1259, + "step": 116500 + }, + { + "epoch": 45.63, + "eval_bleu_bleu": 0.0858393462365002, + "eval_bleu_brevity_penalty": 0.9505585406886313, + "eval_bleu_length_ratio": 0.9517414459520143, + "eval_bleu_precisions": [ + 0.3727753770173737, + 0.13616432473698023, + 0.05634461576838527, + 0.023252366290340973 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226780, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.353064363967142, + "eval_chrf_word_order": 2, + "eval_loss": 2.218111276626587, + "eval_meteor": 0.28276316619119407, + "eval_runtime": 891.7044, + "eval_samples_per_second": 19.287, + "eval_scarebleu_bp": 0.9778137877415032, + "eval_scarebleu_counts": [ + 97867, + 34648, + 13802, + 5578 + ], + "eval_scarebleu_precisions": [ + 39.91541115724389, + 15.197091113245698, + 6.546879298731607, + 2.8791757856051534 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.11130135528795, + "eval_scarebleu_sys_len": 245186, + "eval_scarebleu_totals": [ + 245186, + 227991, + 210818, + 193736 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 161196, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.8181701615156, + "step": 116500 + }, + { + "epoch": 45.83, + "learning_rate": 3.885225029609159e-05, + "loss": 2.1309, + "step": 117000 + }, + { + "epoch": 45.83, + "eval_bleu_bleu": 0.0857966897477264, + "eval_bleu_brevity_penalty": 0.9493114477398834, + "eval_bleu_length_ratio": 0.9505537626060206, + "eval_bleu_precisions": [ + 0.3739078221786602, + 0.1365156568021328, + 0.05631772335043874, + 0.02320893178378687 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226497, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.353109895632443, + "eval_chrf_word_order": 2, + "eval_loss": 2.212167978286743, + "eval_meteor": 0.2834761654848561, + "eval_runtime": 888.9141, + "eval_samples_per_second": 19.347, + "eval_scarebleu_bp": 0.9777077665963022, + "eval_scarebleu_counts": [ + 98041, + 34757, + 13807, + 5570 + ], + "eval_scarebleu_precisions": [ + 39.99061837167564, + 15.246638738402824, + 6.550027752344717, + 2.8753432860476162 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.121044471247147, + "eval_scarebleu_sys_len": 245160, + "eval_scarebleu_totals": [ + 245160, + 227965, + 210793, + 193716 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 160984, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.7210867842963, + "step": 117000 + }, + { + "epoch": 46.02, + "learning_rate": 3.880300039478879e-05, + "loss": 2.1316, + "step": 117500 + }, + { + "epoch": 46.02, + "eval_bleu_bleu": 0.086212437990534, + "eval_bleu_brevity_penalty": 0.9473960728901846, + "eval_bleu_length_ratio": 0.9487323683581013, + "eval_bleu_precisions": [ + 0.3741479145194039, + 0.13711530727540838, + 0.05680976474883939, + 0.02352887296126037 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226063, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.439721123467123, + "eval_chrf_word_order": 2, + "eval_loss": 2.2119810581207275, + "eval_meteor": 0.28362319734163144, + "eval_runtime": 885.417, + "eval_samples_per_second": 19.424, + "eval_scarebleu_bp": 0.9783111248243889, + "eval_scarebleu_counts": [ + 98147, + 34911, + 13949, + 5671 + ], + "eval_scarebleu_precisions": [ + 40.00970208880265, + 15.304257100647487, + 6.612655491504855, + 2.925186209173252 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.205957098013107, + "eval_scarebleu_sys_len": 245308, + "eval_scarebleu_totals": [ + 245308, + 228113, + 210944, + 193868 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 160726, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.60293814598225, + "step": 117500 + }, + { + "epoch": 46.22, + "learning_rate": 3.8753651796288986e-05, + "loss": 2.108, + "step": 118000 + }, + { + "epoch": 46.22, + "eval_bleu_bleu": 0.08649505168173684, + "eval_bleu_brevity_penalty": 0.9495539312901542, + "eval_bleu_length_ratio": 0.9507845844577155, + "eval_bleu_precisions": [ + 0.37515007592075994, + 0.1371485070955354, + 0.0568213154074683, + 0.02354935945742276 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226552, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.46903162936241, + "eval_chrf_word_order": 2, + "eval_loss": 2.209543466567993, + "eval_meteor": 0.2844484193592734, + "eval_runtime": 884.3214, + "eval_samples_per_second": 19.448, + "eval_scarebleu_bp": 0.9797569187922502, + "eval_scarebleu_counts": [ + 98585, + 34959, + 13917, + 5630 + ], + "eval_scarebleu_precisions": [ + 40.13017833373361, + 15.30148642260623, + 6.586401260772649, + 2.898759660386879 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.19493862022322, + "eval_scarebleu_sys_len": 245663, + "eval_scarebleu_totals": [ + 245663, + 228468, + 211299, + 194221 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 160538, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.51684533976892, + "step": 118000 + }, + { + "epoch": 46.42, + "learning_rate": 3.870430319778918e-05, + "loss": 2.1012, + "step": 118500 + }, + { + "epoch": 46.42, + "eval_bleu_bleu": 0.08660782617658401, + "eval_bleu_brevity_penalty": 0.9529164807791017, + "eval_bleu_length_ratio": 0.9539909098158041, + "eval_bleu_precisions": [ + 0.37267944183427476, + 0.13684496076070454, + 0.056855459336764044, + 0.023532755435554924 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227316, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.537688132202064, + "eval_chrf_word_order": 2, + "eval_loss": 2.2145776748657227, + "eval_meteor": 0.2835471503650807, + "eval_runtime": 893.5619, + "eval_samples_per_second": 19.247, + "eval_scarebleu_bp": 0.9832184856054086, + "eval_scarebleu_counts": [ + 98241, + 35008, + 14041, + 5691 + ], + "eval_scarebleu_precisions": [ + 39.85193598766809, + 15.26600383743241, + 6.618461552965133, + 2.917459129427325 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.2360922400412, + "eval_scarebleu_sys_len": 246515, + "eval_scarebleu_totals": [ + 246515, + 229320, + 212149, + 195067 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 160875, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.67117127431091, + "step": 118500 + }, + { + "epoch": 46.61, + "learning_rate": 3.8654954599289386e-05, + "loss": 2.1132, + "step": 119000 + }, + { + "epoch": 46.61, + "eval_bleu_bleu": 0.08633734947413302, + "eval_bleu_brevity_penalty": 0.9420109315175664, + "eval_bleu_length_ratio": 0.9436291070551748, + "eval_bleu_precisions": [ + 0.37706084581960175, + 0.13833721803787105, + 0.057219649962728485, + 0.023641520528518558 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 224847, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.42141994672048, + "eval_chrf_word_order": 2, + "eval_loss": 2.20444655418396, + "eval_meteor": 0.28471214857908006, + "eval_runtime": 884.7797, + "eval_samples_per_second": 19.438, + "eval_scarebleu_bp": 0.9706819121785947, + "eval_scarebleu_counts": [ + 98182, + 34945, + 13910, + 5615 + ], + "eval_scarebleu_precisions": [ + 40.33059073376519, + 15.44544040168311, + 6.653019447287615, + 2.924448703659337 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.184773076102429, + "eval_scarebleu_sys_len": 243443, + "eval_scarebleu_totals": [ + 243443, + 226248, + 209078, + 192002 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 160276, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.39686493962056, + "step": 119000 + }, + { + "epoch": 46.81, + "learning_rate": 3.860560600078958e-05, + "loss": 2.1167, + "step": 119500 + }, + { + "epoch": 46.81, + "eval_bleu_bleu": 0.08644178813517502, + "eval_bleu_brevity_penalty": 0.9506378111304641, + "eval_bleu_length_ratio": 0.9518169876489325, + "eval_bleu_precisions": [ + 0.3739539149375215, + 0.13693983387642353, + 0.05672819105817797, + 0.02353357011327811 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226798, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.558523283489404, + "eval_chrf_word_order": 2, + "eval_loss": 2.2044458389282227, + "eval_meteor": 0.28455744709472686, + "eval_runtime": 909.0332, + "eval_samples_per_second": 18.919, + "eval_scarebleu_bp": 0.9788856147570383, + "eval_scarebleu_counts": [ + 98188, + 34902, + 13923, + 5651 + ], + "eval_scarebleu_precisions": [ + 40.003422299540844, + 15.29086018207786, + 6.595921074448682, + 2.9128415539965875 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.192067478873804, + "eval_scarebleu_sys_len": 245449, + "eval_scarebleu_totals": [ + 245449, + 228254, + 211085, + 194003 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 160712, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.59652697956211, + "step": 119500 + }, + { + "epoch": 47.0, + "learning_rate": 3.855625740228977e-05, + "loss": 2.1154, + "step": 120000 + }, + { + "epoch": 47.0, + "eval_bleu_bleu": 0.08679959487489236, + "eval_bleu_brevity_penalty": 0.9460169705814733, + "eval_bleu_length_ratio": 0.9474229789448504, + "eval_bleu_precisions": [ + 0.3762552546832572, + 0.13813556071271024, + 0.057221975495702605, + 0.023830006882312457 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225751, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.54631624622082, + "eval_chrf_word_order": 2, + "eval_loss": 2.198996067047119, + "eval_meteor": 0.2847422962666821, + "eval_runtime": 880.0256, + "eval_samples_per_second": 19.543, + "eval_scarebleu_bp": 0.9761447195496443, + "eval_scarebleu_counts": [ + 98461, + 35015, + 13972, + 5666 + ], + "eval_scarebleu_precisions": [ + 40.224776020622855, + 15.385663189531686, + 6.6403372447257984, + 2.9307401851756065 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.226064722955998, + "eval_scarebleu_sys_len": 244777, + "eval_scarebleu_totals": [ + 244777, + 227582, + 210411, + 193330 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 160444, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.47379893666226, + "step": 120000 + }, + { + "epoch": 47.2, + "learning_rate": 3.8506908803789975e-05, + "loss": 2.0835, + "step": 120500 + }, + { + "epoch": 47.2, + "eval_bleu_bleu": 0.08701548270067755, + "eval_bleu_brevity_penalty": 0.9483806746712726, + "eval_bleu_length_ratio": 0.9496682460477004, + "eval_bleu_precisions": [ + 0.3741548306125876, + 0.13760994016959124, + 0.05731717483275327, + 0.02401427133839539 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226286, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.54962093524476, + "eval_chrf_word_order": 2, + "eval_loss": 2.208310127258301, + "eval_meteor": 0.28474472818432445, + "eval_runtime": 878.937, + "eval_samples_per_second": 19.567, + "eval_scarebleu_bp": 0.9778586395329898, + "eval_scarebleu_counts": [ + 98138, + 35037, + 14035, + 5737 + ], + "eval_scarebleu_precisions": [ + 40.024143851678446, + 15.366970465171358, + 6.656959095393488, + 2.9610475408905335 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.26086493940443, + "eval_scarebleu_sys_len": 245197, + "eval_scarebleu_totals": [ + 245197, + 228002, + 210832, + 193749 + ], + "eval_steps_per_second": 0.612, + "eval_ter_num_edits": 160692, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.58736817039049, + "step": 120500 + }, + { + "epoch": 47.4, + "learning_rate": 3.845756020529017e-05, + "loss": 2.0939, + "step": 121000 + }, + { + "epoch": 47.4, + "eval_bleu_bleu": 0.08679227116781889, + "eval_bleu_brevity_penalty": 0.9461452322785205, + "eval_bleu_length_ratio": 0.9475446850121076, + "eval_bleu_precisions": [ + 0.37484276729559746, + 0.13777596663230818, + 0.05746345846436743, + 0.023860449913698685 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225780, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.653848739461658, + "eval_chrf_word_order": 2, + "eval_loss": 2.206245183944702, + "eval_meteor": 0.2843712122655587, + "eval_runtime": 910.3648, + "eval_samples_per_second": 18.891, + "eval_scarebleu_bp": 0.9741701605009303, + "eval_scarebleu_counts": [ + 97982, + 34939, + 13983, + 5681 + ], + "eval_scarebleu_precisions": [ + 40.10823024716121, + 15.384920233026126, + 6.660791692468918, + 2.9458280831116572 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.218809951538287, + "eval_scarebleu_sys_len": 244294, + "eval_scarebleu_totals": [ + 244294, + 227099, + 209930, + 192849 + ], + "eval_steps_per_second": 0.591, + "eval_ter_num_edits": 160575, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.53378913673644, + "step": 121000 + }, + { + "epoch": 47.59, + "learning_rate": 3.840831030398737e-05, + "loss": 2.0963, + "step": 121500 + }, + { + "epoch": 47.59, + "eval_bleu_bleu": 0.08777019951032791, + "eval_bleu_brevity_penalty": 0.9500739804111344, + "eval_bleu_length_ratio": 0.9512798022486245, + "eval_bleu_precisions": [ + 0.3761371156306525, + 0.1387468671679198, + 0.05768570804604873, + 0.024194744588843378 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226670, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.752253533908803, + "eval_chrf_word_order": 2, + "eval_loss": 2.1963233947753906, + "eval_meteor": 0.2866845035997963, + "eval_runtime": 876.692, + "eval_samples_per_second": 19.617, + "eval_scarebleu_bp": 0.9785189563392712, + "eval_scarebleu_counts": [ + 98705, + 35274, + 14120, + 5775 + ], + "eval_scarebleu_precisions": [ + 40.22880758398917, + 15.459932329377114, + 6.692069991848187, + 2.9780628925628356 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.32473742171055, + "eval_scarebleu_sys_len": 245359, + "eval_scarebleu_totals": [ + 245359, + 228164, + 210996, + 193918 + ], + "eval_steps_per_second": 0.614, + "eval_ter_num_edits": 160291, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.40373404649927, + "step": 121500 + }, + { + "epoch": 47.79, + "learning_rate": 3.8359060402684566e-05, + "loss": 2.1022, + "step": 122000 + }, + { + "epoch": 47.79, + "eval_bleu_bleu": 0.08815903186890459, + "eval_bleu_brevity_penalty": 0.9514829909583857, + "eval_bleu_length_ratio": 0.9526227657493946, + "eval_bleu_precisions": [ + 0.37639103044186967, + 0.13905955814008913, + 0.05797402381669245, + 0.024287878270179156 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226990, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.844559879070356, + "eval_chrf_word_order": 2, + "eval_loss": 2.1964762210845947, + "eval_meteor": 0.28745492775829684, + "eval_runtime": 893.2904, + "eval_samples_per_second": 19.252, + "eval_scarebleu_bp": 0.9818344576970895, + "eval_scarebleu_counts": [ + 99018, + 35502, + 14254, + 5822 + ], + "eval_scarebleu_precisions": [ + 40.222769260766775, + 15.504478576638032, + 6.729647937528623, + 2.989811429275708 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.39153221992016, + "eval_scarebleu_sys_len": 246174, + "eval_scarebleu_totals": [ + 246174, + 228979, + 211809, + 194728 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 160102, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.31718329982736, + "step": 122000 + }, + { + "epoch": 47.98, + "learning_rate": 3.830971180418476e-05, + "loss": 2.1049, + "step": 122500 + }, + { + "epoch": 47.98, + "eval_bleu_bleu": 0.08762274598911442, + "eval_bleu_brevity_penalty": 0.9476654947212356, + "eval_bleu_length_ratio": 0.9489883707754355, + "eval_bleu_precisions": [ + 0.3770099591374644, + 0.13902330456758039, + 0.05769962819850966, + 0.024167610937517885 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226124, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.702910767140118, + "eval_chrf_word_order": 2, + "eval_loss": 2.1909446716308594, + "eval_meteor": 0.2868452386695186, + "eval_runtime": 879.6542, + "eval_samples_per_second": 19.551, + "eval_scarebleu_bp": 0.9783437286410664, + "eval_scarebleu_counts": [ + 98802, + 35373, + 14151, + 5754 + ], + "eval_scarebleu_precisions": [ + 40.2753998923837, + 15.506244493054124, + 6.7082246977956865, + 2.9679682261309126 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.331057999410477, + "eval_scarebleu_sys_len": 245316, + "eval_scarebleu_totals": [ + 245316, + 228121, + 210950, + 193870 + ], + "eval_steps_per_second": 0.612, + "eval_ter_num_edits": 159966, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.25490339746025, + "step": 122500 + }, + { + "epoch": 48.18, + "learning_rate": 3.8260363205684966e-05, + "loss": 2.0681, + "step": 123000 + }, + { + "epoch": 48.18, + "eval_bleu_bleu": 0.0878519056358411, + "eval_bleu_brevity_penalty": 0.9504924774243725, + "eval_bleu_length_ratio": 0.9516784945379156, + "eval_bleu_precisions": [ + 0.37593984962406013, + 0.13870305864388988, + 0.05776756804515381, + 0.02422822083090994 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226765, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.768089032657326, + "eval_chrf_word_order": 2, + "eval_loss": 2.1915793418884277, + "eval_meteor": 0.28692571586952237, + "eval_runtime": 892.4229, + "eval_samples_per_second": 19.271, + "eval_scarebleu_bp": 0.9790281686121539, + "eval_scarebleu_counts": [ + 98646, + 35288, + 14152, + 5784 + ], + "eval_scarebleu_precisions": [ + 40.18428899643154, + 15.457599796748857, + 6.7034237101877645, + 2.9809362324965343 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.333730084308625, + "eval_scarebleu_sys_len": 245484, + "eval_scarebleu_totals": [ + 245484, + 228289, + 211116, + 194033 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 160204, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.36389322660267, + "step": 123000 + }, + { + "epoch": 48.37, + "learning_rate": 3.8211014607185155e-05, + "loss": 2.0797, + "step": 123500 + }, + { + "epoch": 48.37, + "eval_bleu_bleu": 0.08784536768311836, + "eval_bleu_brevity_penalty": 0.9528110144915772, + "eval_bleu_length_ratio": 0.9538901875532464, + "eval_bleu_precisions": [ + 0.37594811959945795, + 0.13881207251888414, + 0.05768174232136749, + 0.024002410474192576 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227292, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.760490118222528, + "eval_chrf_word_order": 2, + "eval_loss": 2.1912484169006348, + "eval_meteor": 0.28711065191427415, + "eval_runtime": 887.4593, + "eval_samples_per_second": 19.379, + "eval_scarebleu_bp": 0.9816476118788745, + "eval_scarebleu_counts": [ + 98953, + 35449, + 14203, + 5774 + ], + "eval_scarebleu_precisions": [ + 40.203877657154, + 15.484443046655572, + 6.7070262510448, + 2.965862277971256 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.355396776868036, + "eval_scarebleu_sys_len": 246128, + "eval_scarebleu_totals": [ + 246128, + 228933, + 211763, + 194682 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 160173, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.34969707238665, + "step": 123500 + }, + { + "epoch": 48.57, + "learning_rate": 3.816166600868535e-05, + "loss": 2.0825, + "step": 124000 + }, + { + "epoch": 48.57, + "eval_bleu_bleu": 0.0876210073958691, + "eval_bleu_brevity_penalty": 0.9474049074833304, + "eval_bleu_length_ratio": 0.948740761879981, + "eval_bleu_precisions": [ + 0.377714374184416, + 0.13934983482548954, + 0.05774376789822074, + 0.024072176456781714 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226065, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.7435874075715, + "eval_chrf_word_order": 2, + "eval_loss": 2.186969757080078, + "eval_meteor": 0.28692331641474733, + "eval_runtime": 869.597, + "eval_samples_per_second": 19.777, + "eval_scarebleu_bp": 0.9773610822995041, + "eval_scarebleu_counts": [ + 98906, + 35384, + 14089, + 5718 + ], + "eval_scarebleu_precisions": [ + 40.35744159951035, + 15.527470598560646, + 6.686504546576304, + 2.952978542102409 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.308037416149732, + "eval_scarebleu_sys_len": 245075, + "eval_scarebleu_totals": [ + 245075, + 227880, + 210708, + 193635 + ], + "eval_steps_per_second": 0.619, + "eval_ter_num_edits": 159971, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.25719309975317, + "step": 124000 + }, + { + "epoch": 48.77, + "learning_rate": 3.8112317410185555e-05, + "loss": 2.0855, + "step": 124500 + }, + { + "epoch": 48.77, + "eval_bleu_bleu": 0.08827672907227922, + "eval_bleu_brevity_penalty": 0.9488439583227515, + "eval_bleu_length_ratio": 0.9501089059463905, + "eval_bleu_precisions": [ + 0.3767464254321064, + 0.1395581177460372, + 0.05833220508441038, + 0.024428292248088592 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226391, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.895469071389382, + "eval_chrf_word_order": 2, + "eval_loss": 2.186830520629883, + "eval_meteor": 0.2869834623378739, + "eval_runtime": 891.8751, + "eval_samples_per_second": 19.283, + "eval_scarebleu_bp": 0.9763815745678373, + "eval_scarebleu_counts": [ + 98650, + 35433, + 14246, + 5827 + ], + "eval_scarebleu_precisions": [ + 40.292441848591906, + 15.565366367949395, + 6.768660616714971, + 3.013051212046 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.383472619417747, + "eval_scarebleu_sys_len": 244835, + "eval_scarebleu_totals": [ + 244835, + 227640, + 210470, + 193392 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 160063, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.29932362194268, + "step": 124500 + }, + { + "epoch": 48.96, + "learning_rate": 3.806296881168575e-05, + "loss": 2.0914, + "step": 125000 + }, + { + "epoch": 48.96, + "eval_bleu_bleu": 0.08868560003116538, + "eval_bleu_brevity_penalty": 0.9531581343853831, + "eval_bleu_length_ratio": 0.954221731667499, + "eval_bleu_precisions": [ + 0.37543046386742374, + 0.1393784257003654, + 0.058196946382961086, + 0.02461089107223021 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227371, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.85039742830893, + "eval_chrf_word_order": 2, + "eval_loss": 2.1884920597076416, + "eval_meteor": 0.28713076741048793, + "eval_runtime": 873.0916, + "eval_samples_per_second": 19.698, + "eval_scarebleu_bp": 0.9777363118319459, + "eval_scarebleu_counts": [ + 98474, + 35432, + 14230, + 5858 + ], + "eval_scarebleu_precisions": [ + 40.16609086867319, + 15.542259575737372, + 6.750410337662831, + 3.0239520958083834 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.388227349559825, + "eval_scarebleu_sys_len": 245167, + "eval_scarebleu_totals": [ + 245167, + 227972, + 210802, + 193720 + ], + "eval_steps_per_second": 0.616, + "eval_ter_num_edits": 160425, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.46509806794921, + "step": 125000 + }, + { + "epoch": 49.16, + "learning_rate": 3.801362021318595e-05, + "loss": 2.0682, + "step": 125500 + }, + { + "epoch": 49.16, + "eval_bleu_bleu": 0.0885649200739642, + "eval_bleu_brevity_penalty": 0.948976287691438, + "eval_bleu_length_ratio": 0.9502348087745878, + "eval_bleu_precisions": [ + 0.37687316989148534, + 0.13981053979906896, + 0.05849980996412747, + 0.024611376763158346 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226421, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.873959683677143, + "eval_chrf_word_order": 2, + "eval_loss": 2.1884639263153076, + "eval_meteor": 0.28757440179315863, + "eval_runtime": 892.2872, + "eval_samples_per_second": 19.274, + "eval_scarebleu_bp": 0.979081112120267, + "eval_scarebleu_counts": [ + 98850, + 35545, + 14348, + 5890 + ], + "eval_scarebleu_precisions": [ + 40.26525782392453, + 15.569289800352164, + 6.795813006204708, + 3.035237614272316 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.440637641255456, + "eval_scarebleu_sys_len": 245497, + "eval_scarebleu_totals": [ + 245497, + 228302, + 211130, + 194054 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 160175, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.35061295330381, + "step": 125500 + }, + { + "epoch": 49.35, + "learning_rate": 3.7964370311883145e-05, + "loss": 2.0741, + "step": 126000 + }, + { + "epoch": 49.35, + "eval_bleu_bleu": 0.08942324099288965, + "eval_bleu_brevity_penalty": 0.9547560396825917, + "eval_bleu_length_ratio": 0.955749352649625, + "eval_bleu_precisions": [ + 0.37696006323138737, + 0.139788163769355, + 0.05885242680290823, + 0.024814289764672526 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227735, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.994768522867417, + "eval_chrf_word_order": 2, + "eval_loss": 2.1806511878967285, + "eval_meteor": 0.28891492977038447, + "eval_runtime": 896.8436, + "eval_samples_per_second": 19.176, + "eval_scarebleu_bp": 0.9804038083054253, + "eval_scarebleu_counts": [ + 99062, + 35634, + 14423, + 5935 + ], + "eval_scarebleu_precisions": [ + 40.29826459796113, + 15.586085632930494, + 6.820804328087167, + 3.0532662489325144 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.484818262566527, + "eval_scarebleu_sys_len": 245822, + "eval_scarebleu_totals": [ + 245822, + 228627, + 211456, + 194382 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 159856, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.20452994701628, + "step": 126000 + }, + { + "epoch": 49.55, + "learning_rate": 3.791502171338334e-05, + "loss": 2.062, + "step": 126500 + }, + { + "epoch": 49.55, + "eval_bleu_bleu": 0.08957081895194714, + "eval_bleu_brevity_penalty": 0.9505849648328949, + "eval_bleu_length_ratio": 0.9517666265176536, + "eval_bleu_precisions": [ + 0.37822440538657587, + 0.14081234404149034, + 0.05908122434131892, + 0.02505316813674902 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226786, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.03376282417516, + "eval_chrf_word_order": 2, + "eval_loss": 2.182044506072998, + "eval_meteor": 0.2890494050443951, + "eval_runtime": 886.1517, + "eval_samples_per_second": 19.408, + "eval_scarebleu_bp": 0.9771611756064884, + "eval_scarebleu_counts": [ + 99090, + 35758, + 14420, + 5952 + ], + "eval_scarebleu_precisions": [ + 40.44060630300458, + 15.694966883347744, + 6.845218315943377, + 3.0747454501309557 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.505333321329516, + "eval_scarebleu_sys_len": 245026, + "eval_scarebleu_totals": [ + 245026, + 227831, + 210658, + 193577 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 159896, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.22284756535954, + "step": 126500 + }, + { + "epoch": 49.75, + "learning_rate": 3.786567311488354e-05, + "loss": 2.065, + "step": 127000 + }, + { + "epoch": 49.75, + "eval_bleu_bleu": 0.08938996729125519, + "eval_bleu_brevity_penalty": 0.9525033439461745, + "eval_bleu_length_ratio": 0.9535964142874529, + "eval_bleu_precisions": [ + 0.3773490243022243, + 0.14013912496964676, + 0.05885921386240259, + 0.0249213742585294 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227222, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 31.978261704010695, + "eval_chrf_word_order": 2, + "eval_loss": 2.1767001152038574, + "eval_meteor": 0.28872100964989644, + "eval_runtime": 895.7867, + "eval_samples_per_second": 19.199, + "eval_scarebleu_bp": 0.9815135491987658, + "eval_scarebleu_counts": [ + 99214, + 35771, + 14444, + 5915 + ], + "eval_scarebleu_precisions": [ + 40.31532538247425, + 15.627348186981214, + 6.821960250887932, + 3.038834402790693 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.492747412197518, + "eval_scarebleu_sys_len": 246095, + "eval_scarebleu_totals": [ + 246095, + 228900, + 211728, + 194647 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 159883, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.21689433939798, + "step": 127000 + }, + { + "epoch": 49.94, + "learning_rate": 3.781632451638374e-05, + "loss": 2.0683, + "step": 127500 + }, + { + "epoch": 49.94, + "eval_bleu_bleu": 0.08959690893960834, + "eval_bleu_brevity_penalty": 0.9523494748557355, + "eval_bleu_length_ratio": 0.9534495276545563, + "eval_bleu_precisions": [ + 0.3779969804610299, + 0.1404815421539868, + 0.05898398606040491, + 0.025011803386860983 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227187, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.036740392419794, + "eval_chrf_word_order": 2, + "eval_loss": 2.175442695617676, + "eval_meteor": 0.2889235480726086, + "eval_runtime": 902.1668, + "eval_samples_per_second": 19.063, + "eval_scarebleu_bp": 0.9817857186139594, + "eval_scarebleu_counts": [ + 99433, + 35842, + 14479, + 5960 + ], + "eval_scarebleu_precisions": [ + 40.39331822133392, + 15.653784169771189, + 6.836359859108379, + 3.0608838558919444 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.529721146163528, + "eval_scarebleu_sys_len": 246162, + "eval_scarebleu_totals": [ + 246162, + 228967, + 211794, + 194715 + ], + "eval_steps_per_second": 0.596, + "eval_ter_num_edits": 159813, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.18483850729727, + "step": 127500 + }, + { + "epoch": 50.14, + "learning_rate": 3.776707461508093e-05, + "loss": 2.0551, + "step": 128000 + }, + { + "epoch": 50.14, + "eval_bleu_bleu": 0.08928234712265935, + "eval_bleu_brevity_penalty": 0.9480010716164256, + "eval_bleu_length_ratio": 0.9493073246068684, + "eval_bleu_precisions": [ + 0.37852785145888596, + 0.14062343006148179, + 0.05905778593246667, + 0.02502617022371966 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226200, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.07358364350697, + "eval_chrf_word_order": 2, + "eval_loss": 2.1779286861419678, + "eval_meteor": 0.2883233717997101, + "eval_runtime": 895.1281, + "eval_samples_per_second": 19.213, + "eval_scarebleu_bp": 0.977801555093336, + "eval_scarebleu_counts": [ + 99189, + 35799, + 14444, + 5965 + ], + "eval_scarebleu_precisions": [ + 40.45508864807103, + 15.702142218011474, + 6.851472374013357, + 3.078836803584148 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.520257854571284, + "eval_scarebleu_sys_len": 245183, + "eval_scarebleu_totals": [ + 245183, + 227988, + 210816, + 193742 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 159734, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.14866121106934, + "step": 128000 + }, + { + "epoch": 50.33, + "learning_rate": 3.771772601658113e-05, + "loss": 2.0441, + "step": 128500 + }, + { + "epoch": 50.33, + "eval_bleu_bleu": 0.09000202637085622, + "eval_bleu_brevity_penalty": 0.951174931162496, + "eval_bleu_length_ratio": 0.9523289924836011, + "eval_bleu_precisions": [ + 0.3791159880133968, + 0.14128024794373584, + 0.059407894395197516, + 0.02519241834682588 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226920, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.11528778506194, + "eval_chrf_word_order": 2, + "eval_loss": 2.1781351566314697, + "eval_meteor": 0.2898215962482735, + "eval_runtime": 914.3024, + "eval_samples_per_second": 18.81, + "eval_scarebleu_bp": 0.9800132825637382, + "eval_scarebleu_counts": [ + 99535, + 35988, + 14535, + 5973 + ], + "eval_scarebleu_precisions": [ + 40.50649910876342, + 15.747535345314203, + 6.876892505677517, + 3.074397010531084 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.560982756656069, + "eval_scarebleu_sys_len": 245726, + "eval_scarebleu_totals": [ + 245726, + 228531, + 211360, + 194282 + ], + "eval_steps_per_second": 0.588, + "eval_ter_num_edits": 159622, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.09737187970819, + "step": 128500 + }, + { + "epoch": 50.53, + "learning_rate": 3.766837741808133e-05, + "loss": 2.0483, + "step": 129000 + }, + { + "epoch": 50.53, + "eval_bleu_bleu": 0.08894482780498306, + "eval_bleu_brevity_penalty": 0.9488968920640124, + "eval_bleu_length_ratio": 0.9501592670776694, + "eval_bleu_precisions": [ + 0.378873071469901, + 0.14071163626629957, + 0.05873470450403541, + 0.024654043491675333 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226403, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.01104609381887, + "eval_chrf_word_order": 2, + "eval_loss": 2.174912691116333, + "eval_meteor": 0.2892846818539126, + "eval_runtime": 896.4477, + "eval_samples_per_second": 19.185, + "eval_scarebleu_bp": 0.9760671172026242, + "eval_scarebleu_counts": [ + 99170, + 35779, + 14355, + 5868 + ], + "eval_scarebleu_precisions": [ + 40.51757245932717, + 15.722678994388367, + 6.822913200946795, + 3.0353503481238557 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.460846787244277, + "eval_scarebleu_sys_len": 244758, + "eval_scarebleu_totals": [ + 244758, + 227563, + 210394, + 193322 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 159774, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.1669788294126, + "step": 129000 + }, + { + "epoch": 50.72, + "learning_rate": 3.761902881958153e-05, + "loss": 2.057, + "step": 129500 + }, + { + "epoch": 50.72, + "eval_bleu_bleu": 0.08881621600428104, + "eval_bleu_brevity_penalty": 0.948468934872636, + "eval_bleu_length_ratio": 0.9497521812664985, + "eval_bleu_precisions": [ + 0.3785582353097134, + 0.141025579716036, + 0.05868164271090018, + 0.024543910903259372 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226306, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.02894999557879, + "eval_chrf_word_order": 2, + "eval_loss": 2.1716012954711914, + "eval_meteor": 0.28875181297262453, + "eval_runtime": 890.4779, + "eval_samples_per_second": 19.313, + "eval_scarebleu_bp": 0.9788733949294742, + "eval_scarebleu_counts": [ + 99279, + 35846, + 14390, + 5857 + ], + "eval_scarebleu_precisions": [ + 40.44840820384117, + 15.704640943522701, + 6.817385042496139, + 3.0190566028010166 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.467215275990542, + "eval_scarebleu_sys_len": 245446, + "eval_scarebleu_totals": [ + 245446, + 228251, + 211078, + 194001 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 159614, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.09370835603954, + "step": 129500 + }, + { + "epoch": 50.92, + "learning_rate": 3.7569680221081724e-05, + "loss": 2.0658, + "step": 130000 + }, + { + "epoch": 50.92, + "eval_bleu_bleu": 0.08976886928996744, + "eval_bleu_brevity_penalty": 0.9525253234042387, + "eval_bleu_length_ratio": 0.9536173980921525, + "eval_bleu_precisions": [ + 0.378718198101458, + 0.1415403367105965, + 0.05918859364873623, + 0.02486351228389445 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227227, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.229176491265136, + "eval_chrf_word_order": 2, + "eval_loss": 2.1695849895477295, + "eval_meteor": 0.29022692385723864, + "eval_runtime": 918.1897, + "eval_samples_per_second": 18.73, + "eval_scarebleu_bp": 0.980985251819307, + "eval_scarebleu_counts": [ + 99571, + 36136, + 14526, + 5969 + ], + "eval_scarebleu_precisions": [ + 40.48177586241945, + 15.795777418367793, + 6.8648393194707, + 3.0684686444555256 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.56819054702119, + "eval_scarebleu_sys_len": 245965, + "eval_scarebleu_totals": [ + 245965, + 228770, + 211600, + 194527 + ], + "eval_steps_per_second": 0.586, + "eval_ter_num_edits": 159518, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.04974607201572, + "step": 130000 + }, + { + "epoch": 51.12, + "learning_rate": 3.752033162258192e-05, + "loss": 2.0436, + "step": 130500 + }, + { + "epoch": 51.12, + "eval_bleu_bleu": 0.08973163245339678, + "eval_bleu_brevity_penalty": 0.9532328160601072, + "eval_bleu_length_ratio": 0.9542930766034774, + "eval_bleu_precisions": [ + 0.3786743363765898, + 0.14134628650811398, + 0.05905695369727613, + 0.024840767950182103 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227388, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.24596279542692, + "eval_chrf_word_order": 2, + "eval_loss": 2.1723663806915283, + "eval_meteor": 0.2906259514752742, + "eval_runtime": 895.091, + "eval_samples_per_second": 19.214, + "eval_scarebleu_bp": 0.9815379255437213, + "eval_scarebleu_counts": [ + 99602, + 36081, + 14536, + 5979 + ], + "eval_scarebleu_precisions": [ + 40.472001332786135, + 15.762365337736888, + 6.865152831828315, + 3.0714935195031363 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.57063448100571, + "eval_scarebleu_sys_len": 246101, + "eval_scarebleu_totals": [ + 246101, + 228906, + 211736, + 194661 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 159508, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.04516666742991, + "step": 130500 + }, + { + "epoch": 51.31, + "learning_rate": 3.747098302408212e-05, + "loss": 2.0304, + "step": 131000 + }, + { + "epoch": 51.31, + "eval_bleu_bleu": 0.0895093740624443, + "eval_bleu_brevity_penalty": 0.9466271801955192, + "eval_bleu_length_ratio": 0.9480021319545575, + "eval_bleu_precisions": [ + 0.3796599214658527, + 0.14172903868822295, + 0.059404286422847, + 0.025008452673623647 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 225889, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.12436303947929, + "eval_chrf_word_order": 2, + "eval_loss": 2.167572259902954, + "eval_meteor": 0.28967609645132514, + "eval_runtime": 885.9262, + "eval_samples_per_second": 19.412, + "eval_scarebleu_bp": 0.977854562178684, + "eval_scarebleu_counts": [ + 99412, + 35996, + 14543, + 5966 + ], + "eval_scarebleu_precisions": [ + 40.543891417478264, + 15.787650054166429, + 6.897941953507786, + 3.0791145610223114 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.55896480739287, + "eval_scarebleu_sys_len": 245196, + "eval_scarebleu_totals": [ + 245196, + 228001, + 210831, + 193757 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 159566, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.07172721402763, + "step": 131000 + }, + { + "epoch": 51.51, + "learning_rate": 3.742163442558231e-05, + "loss": 2.0373, + "step": 131500 + }, + { + "epoch": 51.51, + "eval_bleu_bleu": 0.08996462515483028, + "eval_bleu_brevity_penalty": 0.9480893635885063, + "eval_bleu_length_ratio": 0.9493912598256665, + "eval_bleu_precisions": [ + 0.3796348687118734, + 0.14218873340509508, + 0.059750033877810554, + 0.025137412133448486 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226220, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.25543210909955, + "eval_chrf_word_order": 2, + "eval_loss": 2.1680328845977783, + "eval_meteor": 0.2900165121699001, + "eval_runtime": 878.216, + "eval_samples_per_second": 19.583, + "eval_scarebleu_bp": 0.9749350888893062, + "eval_scarebleu_counts": [ + 99269, + 36008, + 14550, + 5953 + ], + "eval_scarebleu_precisions": [ + 40.603973314899726, + 15.84259479246412, + 6.924746330598336, + 3.083720978419651 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.554657607883922, + "eval_scarebleu_sys_len": 244481, + "eval_scarebleu_totals": [ + 244481, + 227286, + 210116, + 193046 + ], + "eval_steps_per_second": 0.613, + "eval_ter_num_edits": 159298, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.94899917112777, + "step": 131500 + }, + { + "epoch": 51.7, + "learning_rate": 3.737238452427951e-05, + "loss": 2.0431, + "step": 132000 + }, + { + "epoch": 51.7, + "eval_bleu_bleu": 0.09117278687596785, + "eval_bleu_brevity_penalty": 0.9565442055287554, + "eval_bleu_length_ratio": 0.9574616311131069, + "eval_bleu_precisions": [ + 0.3792840455328456, + 0.14231469366858182, + 0.06004499762627201, + 0.025465346534653464 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228143, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.335028729831464, + "eval_chrf_word_order": 2, + "eval_loss": 2.165398359298706, + "eval_meteor": 0.2917418510693046, + "eval_runtime": 889.7939, + "eval_samples_per_second": 19.328, + "eval_scarebleu_bp": 0.9829872688175166, + "eval_scarebleu_counts": [ + 99902, + 36288, + 14705, + 6056 + ], + "eval_scarebleu_precisions": [ + 40.53510131543711, + 15.828110074455974, + 6.93327926899992, + 3.105465845516407 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.656861877954256, + "eval_scarebleu_sys_len": 246458, + "eval_scarebleu_totals": [ + 246458, + 229263, + 212093, + 195011 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 159221, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.91373775581698, + "step": 132000 + }, + { + "epoch": 51.9, + "learning_rate": 3.732303592577971e-05, + "loss": 2.0537, + "step": 132500 + }, + { + "epoch": 51.9, + "eval_bleu_bleu": 0.09005710195839348, + "eval_bleu_brevity_penalty": 0.9562726712906505, + "eval_bleu_length_ratio": 0.9572014319348326, + "eval_bleu_precisions": [ + 0.37832612098333485, + 0.14084386825109302, + 0.05895895275850677, + 0.025037493986813434 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228081, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.284486616320955, + "eval_chrf_word_order": 2, + "eval_loss": 2.1634762287139893, + "eval_meteor": 0.2908909543355116, + "eval_runtime": 886.7754, + "eval_samples_per_second": 19.394, + "eval_scarebleu_bp": 0.9828128073350563, + "eval_scarebleu_counts": [ + 99701, + 36045, + 14532, + 6005 + ], + "eval_scarebleu_precisions": [ + 40.46060507680133, + 15.725067620626472, + 6.853068365629023, + 3.0798504438985113 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.579879079349295, + "eval_scarebleu_sys_len": 246415, + "eval_scarebleu_totals": [ + 246415, + 229220, + 212051, + 194977 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 159536, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 73.05798900027018, + "step": 132500 + }, + { + "epoch": 52.1, + "learning_rate": 3.7273687327279903e-05, + "loss": 2.0366, + "step": 133000 + }, + { + "epoch": 52.1, + "eval_bleu_bleu": 0.09087562531773268, + "eval_bleu_brevity_penalty": 0.9521076350112606, + "eval_bleu_length_ratio": 0.9532187058028614, + "eval_bleu_precisions": [ + 0.37993325467129246, + 0.14230459614074698, + 0.06004346991601695, + 0.025565449941676862 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227132, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.41500474890028, + "eval_chrf_word_order": 2, + "eval_loss": 2.1658763885498047, + "eval_meteor": 0.29193886022008, + "eval_runtime": 886.9906, + "eval_samples_per_second": 19.389, + "eval_scarebleu_bp": 0.9818791331411618, + "eval_scarebleu_counts": [ + 99959, + 36334, + 14747, + 6099 + ], + "eval_scarebleu_precisions": [ + 40.60320490687897, + 15.867068430935849, + 6.962108980351056, + 3.1317877224062234 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.689455077710095, + "eval_scarebleu_sys_len": 246185, + "eval_scarebleu_totals": [ + 246185, + 228990, + 211818, + 194745 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 159251, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.92747596957445, + "step": 133000 + }, + { + "epoch": 52.29, + "learning_rate": 3.7224338728780107e-05, + "loss": 2.0268, + "step": 133500 + }, + { + "epoch": 52.29, + "eval_bleu_bleu": 0.09030987837362191, + "eval_bleu_brevity_penalty": 0.9523934397538023, + "eval_bleu_length_ratio": 0.9534914952639553, + "eval_bleu_precisions": [ + 0.379203950756392, + 0.14226531175893564, + 0.05962394084276247, + 0.025135231984710682 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227197, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.33047935871033, + "eval_chrf_word_order": 2, + "eval_loss": 2.165220022201538, + "eval_meteor": 0.2908637119775906, + "eval_runtime": 889.3477, + "eval_samples_per_second": 19.338, + "eval_scarebleu_bp": 0.9802085641209763, + "eval_scarebleu_counts": [ + 99630, + 36261, + 14631, + 6004 + ], + "eval_scarebleu_precisions": [ + 40.53724153083727, + 15.863662016195713, + 6.920773673530205, + 3.089589872896619 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.614432335411312, + "eval_scarebleu_sys_len": 245774, + "eval_scarebleu_totals": [ + 245774, + 228579, + 211407, + 194330 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 159362, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.97830736047699, + "step": 133500 + }, + { + "epoch": 52.49, + "learning_rate": 3.71750888274773e-05, + "loss": 2.0196, + "step": 134000 + }, + { + "epoch": 52.49, + "eval_bleu_bleu": 0.09126656826011342, + "eval_bleu_brevity_penalty": 0.9565704792937577, + "eval_bleu_length_ratio": 0.9574868116787464, + "eval_bleu_precisions": [ + 0.37932228499796183, + 0.14232012666268476, + 0.059944477698198106, + 0.025606789250353607 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228149, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.43689140968936, + "eval_chrf_word_order": 2, + "eval_loss": 2.1638407707214355, + "eval_meteor": 0.2922002092149941, + "eval_runtime": 912.2314, + "eval_samples_per_second": 18.853, + "eval_scarebleu_bp": 0.9836442737091105, + "eval_scarebleu_counts": [ + 99978, + 36397, + 14728, + 6107 + ], + "eval_scarebleu_precisions": [ + 40.53929121725732, + 15.864443717990628, + 6.938921659159867, + 3.1290990326282997 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.692792547708393, + "eval_scarebleu_sys_len": 246620, + "eval_scarebleu_totals": [ + 246620, + 229425, + 212252, + 195168 + ], + "eval_steps_per_second": 0.59, + "eval_ter_num_edits": 159307, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.953120635255, + "step": 134000 + }, + { + "epoch": 52.68, + "learning_rate": 3.71257402289775e-05, + "loss": 2.0306, + "step": 134500 + }, + { + "epoch": 52.68, + "eval_bleu_bleu": 0.09103465793950112, + "eval_bleu_brevity_penalty": 0.9513773806264898, + "eval_bleu_length_ratio": 0.9525220434868369, + "eval_bleu_precisions": [ + 0.3804446480970718, + 0.14254591912132755, + 0.0603142133244725, + 0.025630072618539085 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226966, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.32388327124968, + "eval_chrf_word_order": 2, + "eval_loss": 2.1580235958099365, + "eval_meteor": 0.29166045991526707, + "eval_runtime": 881.0586, + "eval_samples_per_second": 19.52, + "eval_scarebleu_bp": 0.9809120813641035, + "eval_scarebleu_counts": [ + 99928, + 36370, + 14769, + 6107 + ], + "eval_scarebleu_precisions": [ + 40.629891805958195, + 15.899314541512206, + 6.98043738213511, + 3.139861901603607 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.700015234107369, + "eval_scarebleu_sys_len": 245947, + "eval_scarebleu_totals": [ + 245947, + 228752, + 211577, + 194499 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 159169, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.88992485197075, + "step": 134500 + }, + { + "epoch": 52.88, + "learning_rate": 3.70763916304777e-05, + "loss": 2.0332, + "step": 135000 + }, + { + "epoch": 52.88, + "eval_bleu_bleu": 0.09060363486018075, + "eval_bleu_brevity_penalty": 0.9511441202175546, + "eval_bleu_length_ratio": 0.9522996151570218, + "eval_bleu_precisions": [ + 0.37994297373883384, + 0.14227677166480704, + 0.05979559193169779, + 0.025472735456156245 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226913, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.382350691593246, + "eval_chrf_word_order": 2, + "eval_loss": 2.156738519668579, + "eval_meteor": 0.2910406465865864, + "eval_runtime": 888.4447, + "eval_samples_per_second": 19.357, + "eval_scarebleu_bp": 0.9794475688438128, + "eval_scarebleu_counts": [ + 99793, + 36211, + 14624, + 6058 + ], + "eval_scarebleu_precisions": [ + 40.63447983810218, + 15.854758485411047, + 6.923586781554777, + 3.1203321211871478 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.638435551850314, + "eval_scarebleu_sys_len": 245587, + "eval_scarebleu_totals": [ + 245587, + 228392, + 211220, + 194146 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 159265, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.93388713599458, + "step": 135000 + }, + { + "epoch": 53.07, + "learning_rate": 3.702704303197789e-05, + "loss": 2.022, + "step": 135500 + }, + { + "epoch": 53.07, + "eval_bleu_bleu": 0.09154107271497687, + "eval_bleu_brevity_penalty": 0.9495803806643658, + "eval_bleu_length_ratio": 0.950809765023355, + "eval_bleu_precisions": [ + 0.38078549422223007, + 0.14362136576185858, + 0.06082079457243346, + 0.025964832153459693 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226558, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.42191647011873, + "eval_chrf_word_order": 2, + "eval_loss": 2.1572072505950928, + "eval_meteor": 0.2918840493337756, + "eval_runtime": 898.6144, + "eval_samples_per_second": 19.138, + "eval_scarebleu_bp": 0.9772019760626239, + "eval_scarebleu_counts": [ + 99732, + 36445, + 14820, + 6149 + ], + "eval_scarebleu_precisions": [ + 40.700958226546305, + 15.99580409144974, + 7.034698818056676, + 3.1763660595290983 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.732008993151025, + "eval_scarebleu_sys_len": 245036, + "eval_scarebleu_totals": [ + 245036, + 227841, + 210670, + 193586 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 159138, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.87572869775471, + "step": 135500 + }, + { + "epoch": 53.27, + "learning_rate": 3.697779313067509e-05, + "loss": 1.9961, + "step": 136000 + }, + { + "epoch": 53.27, + "eval_bleu_bleu": 0.09103154067687554, + "eval_bleu_brevity_penalty": 0.952718722795932, + "eval_bleu_length_ratio": 0.9538020555735084, + "eval_bleu_precisions": [ + 0.38032129044180735, + 0.14278642015270665, + 0.06006821692567672, + 0.025552093520434853 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227271, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.50475355981454, + "eval_chrf_word_order": 2, + "eval_loss": 2.156723737716675, + "eval_meteor": 0.29178249336450646, + "eval_runtime": 896.0651, + "eval_samples_per_second": 19.193, + "eval_scarebleu_bp": 0.9832914905146276, + "eval_scarebleu_counts": [ + 100174, + 36519, + 14811, + 6129 + ], + "eval_scarebleu_precisions": [ + 40.633099828420534, + 15.923658530204328, + 6.980920420052413, + 3.1417074608503985 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.732047623423812, + "eval_scarebleu_sys_len": 246533, + "eval_scarebleu_totals": [ + 246533, + 229338, + 212164, + 195085 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 159096, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.85649519849429, + "step": 136000 + }, + { + "epoch": 53.47, + "learning_rate": 3.692844453217529e-05, + "loss": 2.0156, + "step": 136500 + }, + { + "epoch": 53.47, + "eval_bleu_bleu": 0.09106521064386212, + "eval_bleu_brevity_penalty": 0.9509460282975083, + "eval_bleu_length_ratio": 0.952110760914726, + "eval_bleu_precisions": [ + 0.380653066981681, + 0.1431276320747068, + 0.060167677859042555, + 0.02565490674310332 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226868, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.469794063424, + "eval_chrf_word_order": 2, + "eval_loss": 2.1539578437805176, + "eval_meteor": 0.2917564994216096, + "eval_runtime": 882.1623, + "eval_samples_per_second": 19.495, + "eval_scarebleu_bp": 0.9776792205639764, + "eval_scarebleu_counts": [ + 99739, + 36367, + 14724, + 6106 + ], + "eval_scarebleu_precisions": [ + 40.68438893262575, + 15.953377376534274, + 6.985349931683619, + 3.152118361889619 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.689666713282115, + "eval_scarebleu_sys_len": 245153, + "eval_scarebleu_totals": [ + 245153, + 227958, + 210784, + 193711 + ], + "eval_steps_per_second": 0.61, + "eval_ter_num_edits": 158988, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.80703762896749, + "step": 136500 + }, + { + "epoch": 53.66, + "learning_rate": 3.6879095933675484e-05, + "loss": 2.017, + "step": 137000 + }, + { + "epoch": 53.66, + "eval_bleu_bleu": 0.09152560415629006, + "eval_bleu_brevity_penalty": 0.9558564739457378, + "eval_bleu_length_ratio": 0.9568027396455415, + "eval_bleu_precisions": [ + 0.3795583939364698, + 0.1427859823237235, + 0.06022764832259131, + 0.02575369770549729 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227986, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.5242443360306, + "eval_chrf_word_order": 2, + "eval_loss": 2.153320074081421, + "eval_meteor": 0.29271320943033485, + "eval_runtime": 904.7234, + "eval_samples_per_second": 19.009, + "eval_scarebleu_bp": 0.9848193340831117, + "eval_scarebleu_counts": [ + 100192, + 36562, + 14878, + 6174 + ], + "eval_scarebleu_precisions": [ + 40.578348386051594, + 15.91624404152972, + 6.999929426709638, + 3.1585894294177534 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.76556964604203, + "eval_scarebleu_sys_len": 246910, + "eval_scarebleu_totals": [ + 246910, + 229715, + 212545, + 195467 + ], + "eval_steps_per_second": 0.595, + "eval_ter_num_edits": 159124, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.86931753133457, + "step": 137000 + }, + { + "epoch": 53.86, + "learning_rate": 3.682974733517569e-05, + "loss": 2.0256, + "step": 137500 + }, + { + "epoch": 53.86, + "eval_bleu_bleu": 0.09184995516501912, + "eval_bleu_brevity_penalty": 0.9576952525812459, + "eval_bleu_length_ratio": 0.9585653792403024, + "eval_bleu_precisions": [ + 0.38087002968398376, + 0.14337321446326184, + 0.06040040194790137, + 0.025652033916496727 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228406, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.615989105584255, + "eval_chrf_word_order": 2, + "eval_loss": 2.1507408618927, + "eval_meteor": 0.29365730509150356, + "eval_runtime": 874.3492, + "eval_samples_per_second": 19.669, + "eval_scarebleu_bp": 0.9849975003962265, + "eval_scarebleu_counts": [ + 100528, + 36705, + 14912, + 6168 + ], + "eval_scarebleu_precisions": [ + 40.70717623525029, + 15.975435129853455, + 7.014440942659579, + 3.1547935676582513 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.788400219741181, + "eval_scarebleu_sys_len": 246954, + "eval_scarebleu_totals": [ + 246954, + 229759, + 212590, + 195512 + ], + "eval_steps_per_second": 0.615, + "eval_ter_num_edits": 158852, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.74475772660038, + "step": 137500 + }, + { + "epoch": 54.05, + "learning_rate": 3.678049743387288e-05, + "loss": 2.0201, + "step": 138000 + }, + { + "epoch": 54.05, + "eval_bleu_bleu": 0.09180554547311374, + "eval_bleu_brevity_penalty": 0.9547253336981143, + "eval_bleu_length_ratio": 0.9557199753230456, + "eval_bleu_precisions": [ + 0.38146385161244994, + 0.14341219666275595, + 0.06053068422168555, + 0.02581943971872519 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227728, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.49961402948328, + "eval_chrf_word_order": 2, + "eval_loss": 2.1494736671447754, + "eval_meteor": 0.29345807058652124, + "eval_runtime": 893.727, + "eval_samples_per_second": 19.243, + "eval_scarebleu_bp": 0.9829994394324879, + "eval_scarebleu_counts": [ + 100487, + 36661, + 14896, + 6172 + ], + "eval_scarebleu_precisions": [ + 40.77196797870657, + 15.990596076173528, + 7.023267875244584, + 3.164836066414382 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.785305845091777, + "eval_scarebleu_sys_len": 246461, + "eval_scarebleu_totals": [ + 246461, + 229266, + 212095, + 195018 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 158887, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.76078564265075, + "step": 138000 + }, + { + "epoch": 54.25, + "learning_rate": 3.6731148835373074e-05, + "loss": 1.9976, + "step": 138500 + }, + { + "epoch": 54.25, + "eval_bleu_bleu": 0.09153533569927763, + "eval_bleu_brevity_penalty": 0.9514609896809342, + "eval_bleu_length_ratio": 0.9526017819446951, + "eval_bleu_precisions": [ + 0.3816375531422781, + 0.14361981028647694, + 0.0607433940715361, + 0.025729222428501463 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226985, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.45789079065515, + "eval_chrf_word_order": 2, + "eval_loss": 2.1494147777557373, + "eval_meteor": 0.2929118213927763, + "eval_runtime": 891.5228, + "eval_samples_per_second": 19.291, + "eval_scarebleu_bp": 0.9799563184020512, + "eval_scarebleu_counts": [ + 100201, + 36520, + 14884, + 6155 + ], + "eval_scarebleu_precisions": [ + 40.77985609168457, + 15.981305548383709, + 7.042480103716181, + 3.168205730051371 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.761082336134677, + "eval_scarebleu_sys_len": 245712, + "eval_scarebleu_totals": [ + 245712, + 228517, + 211346, + 194274 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 159085, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.8514578534499, + "step": 138500 + }, + { + "epoch": 54.45, + "learning_rate": 3.668180023687328e-05, + "loss": 1.9974, + "step": 139000 + }, + { + "epoch": 54.45, + "eval_bleu_bleu": 0.09158251487303098, + "eval_bleu_brevity_penalty": 0.9562682911283197, + "eval_bleu_length_ratio": 0.9571972351738928, + "eval_bleu_precisions": [ + 0.3799631708172571, + 0.1432202385186239, + 0.06047169470440362, + 0.025564258710071765 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228080, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.61399300341489, + "eval_chrf_word_order": 2, + "eval_loss": 2.151350498199463, + "eval_meteor": 0.292960616867111, + "eval_runtime": 905.9101, + "eval_samples_per_second": 18.984, + "eval_scarebleu_bp": 0.9813510253269082, + "eval_scarebleu_counts": [ + 99970, + 36497, + 14868, + 6141 + ], + "eval_scarebleu_precisions": [ + 40.629127634065554, + 15.947304028663812, + 7.023444548894379, + 3.1554445677642127 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.742571470353983, + "eval_scarebleu_sys_len": 246055, + "eval_scarebleu_totals": [ + 246055, + 228860, + 211691, + 194616 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 159166, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.88855103059501, + "step": 139000 + }, + { + "epoch": 54.64, + "learning_rate": 3.6632451638373473e-05, + "loss": 2.0127, + "step": 139500 + }, + { + "epoch": 54.64, + "eval_bleu_bleu": 0.09204685026614043, + "eval_bleu_brevity_penalty": 0.953021936469064, + "eval_bleu_length_ratio": 0.9540916320783619, + "eval_bleu_precisions": [ + 0.38295944400457466, + 0.14438601917723476, + 0.060819143754339784, + 0.025876522440906845 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227340, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.580622420402925, + "eval_chrf_word_order": 2, + "eval_loss": 2.1451799869537354, + "eval_meteor": 0.2943133926096102, + "eval_runtime": 891.9845, + "eval_samples_per_second": 19.281, + "eval_scarebleu_bp": 0.9801394061773301, + "eval_scarebleu_counts": [ + 100515, + 36701, + 14891, + 6165 + ], + "eval_scarebleu_precisions": [ + 40.900157472625395, + 16.05734986568196, + 7.044358977997909, + 3.1726508746018105 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.788312143300741, + "eval_scarebleu_sys_len": 245757, + "eval_scarebleu_totals": [ + 245757, + 228562, + 211389, + 194317 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 158519, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.59226355389272, + "step": 139500 + }, + { + "epoch": 54.84, + "learning_rate": 3.658310303987367e-05, + "loss": 2.0007, + "step": 140000 + }, + { + "epoch": 54.84, + "eval_bleu_bleu": 0.09216861773979945, + "eval_bleu_brevity_penalty": 0.9519141230366354, + "eval_bleu_length_ratio": 0.9530340483215055, + "eval_bleu_precisions": [ + 0.38285158176565914, + 0.1448118803390299, + 0.060959980906227784, + 0.026005293263894818 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227088, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.59102353554792, + "eval_chrf_word_order": 2, + "eval_loss": 2.142103672027588, + "eval_meteor": 0.29398029108065515, + "eval_runtime": 887.8098, + "eval_samples_per_second": 19.371, + "eval_scarebleu_bp": 0.9825936737923394, + "eval_scarebleu_counts": [ + 100694, + 36939, + 15031, + 6233 + ], + "eval_scarebleu_precisions": [ + 40.87254070246508, + 16.118883254933106, + 7.090295008349293, + 3.1977713590913055 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.86284389065126, + "eval_scarebleu_sys_len": 246361, + "eval_scarebleu_totals": [ + 246361, + 229166, + 211994, + 194917 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 158702, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.67606665781315, + "step": 140000 + }, + { + "epoch": 55.03, + "learning_rate": 3.6533754441373866e-05, + "loss": 1.9997, + "step": 140500 + }, + { + "epoch": 55.03, + "eval_bleu_bleu": 0.09195417311223618, + "eval_bleu_brevity_penalty": 0.9536764034728623, + "eval_bleu_length_ratio": 0.954716949458408, + "eval_bleu_precisions": [ + 0.38237892821191355, + 0.14446441648358965, + 0.060828233247382645, + 0.025722997950109877 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227489, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.66727537591338, + "eval_chrf_word_order": 2, + "eval_loss": 2.1442689895629883, + "eval_meteor": 0.294493504553735, + "eval_runtime": 890.9889, + "eval_samples_per_second": 19.302, + "eval_scarebleu_bp": 0.9801556790564163, + "eval_scarebleu_counts": [ + 100422, + 36825, + 14985, + 6183 + ], + "eval_scarebleu_precisions": [ + 40.86165013976994, + 16.111320143853415, + 7.08865909155416, + 3.1817503486391496 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.819678731772838, + "eval_scarebleu_sys_len": 245761, + "eval_scarebleu_totals": [ + 245761, + 228566, + 211394, + 194327 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 158749, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.69758985936649, + "step": 140500 + }, + { + "epoch": 55.23, + "learning_rate": 3.648440584287406e-05, + "loss": 1.9795, + "step": 141000 + }, + { + "epoch": 55.23, + "eval_bleu_bleu": 0.09184797860214314, + "eval_bleu_brevity_penalty": 0.9496288694586387, + "eval_bleu_length_ratio": 0.9508559293936939, + "eval_bleu_precisions": [ + 0.3830930091936673, + 0.14476487051878456, + 0.06106246715882901, + 0.025841696064664178 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226569, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.610333205234376, + "eval_chrf_word_order": 2, + "eval_loss": 2.1434454917907715, + "eval_meteor": 0.29361218694294755, + "eval_runtime": 893.1977, + "eval_samples_per_second": 19.254, + "eval_scarebleu_bp": 0.9791340528841607, + "eval_scarebleu_counts": [ + 100422, + 36774, + 14967, + 6182 + ], + "eval_scarebleu_precisions": [ + 40.90342552238198, + 16.106694698114445, + 7.088594405660645, + 3.185432135661691 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.813488006210923, + "eval_scarebleu_sys_len": 245510, + "eval_scarebleu_totals": [ + 245510, + 228315, + 211142, + 194071 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 158673, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.66278638451429, + "step": 141000 + }, + { + "epoch": 55.42, + "learning_rate": 3.643515594157126e-05, + "loss": 1.9845, + "step": 141500 + }, + { + "epoch": 55.42, + "eval_bleu_bleu": 0.09267177974363285, + "eval_bleu_brevity_penalty": 0.957428392625882, + "eval_bleu_length_ratio": 0.958309376822968, + "eval_bleu_precisions": [ + 0.3820359543672951, + 0.14437603599336965, + 0.06103344467813106, + 0.02607339428803924 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228345, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.71516809091818, + "eval_chrf_word_order": 2, + "eval_loss": 2.1410973072052, + "eval_meteor": 0.2950861948755206, + "eval_runtime": 889.6033, + "eval_samples_per_second": 19.332, + "eval_scarebleu_bp": 0.9828777267303433, + "eval_scarebleu_counts": [ + 100633, + 36880, + 15003, + 6219 + ], + "eval_scarebleu_precisions": [ + 40.83617726665882, + 16.088223490202235, + 7.074684296398291, + 3.1893452585477426 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.845259207360712, + "eval_scarebleu_sys_len": 246431, + "eval_scarebleu_totals": [ + 246431, + 229236, + 212066, + 194993 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 158616, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.63668377837513, + "step": 141500 + }, + { + "epoch": 55.62, + "learning_rate": 3.6385807343071456e-05, + "loss": 1.9982, + "step": 142000 + }, + { + "epoch": 55.62, + "eval_bleu_bleu": 0.09220664019182924, + "eval_bleu_brevity_penalty": 0.9500431372057159, + "eval_bleu_length_ratio": 0.9512504249220451, + "eval_bleu_precisions": [ + 0.38267824920697247, + 0.14481925640193252, + 0.0613810209716755, + 0.026084426365124917 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 226663, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.74355496813639, + "eval_chrf_word_order": 2, + "eval_loss": 2.1437759399414062, + "eval_meteor": 0.2932058951329323, + "eval_runtime": 916.7062, + "eval_samples_per_second": 18.761, + "eval_scarebleu_bp": 0.9795574802197247, + "eval_scarebleu_counts": [ + 100338, + 36827, + 15017, + 6222 + ], + "eval_scarebleu_precisions": [ + 40.85190583598655, + 16.12256423502423, + 7.10874000577523, + 3.2043094924192483 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.84109890725552, + "eval_scarebleu_sys_len": 245614, + "eval_scarebleu_totals": [ + 245614, + 228419, + 211247, + 194176 + ], + "eval_steps_per_second": 0.587, + "eval_ter_num_edits": 158511, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.58860003022407, + "step": 142000 + }, + { + "epoch": 55.82, + "learning_rate": 3.633645874457165e-05, + "loss": 1.9943, + "step": 142500 + }, + { + "epoch": 55.82, + "eval_bleu_bleu": 0.09282966509144983, + "eval_bleu_brevity_penalty": 0.9543348505530518, + "eval_bleu_length_ratio": 0.955346463599394, + "eval_bleu_precisions": [ + 0.38182385267902247, + 0.14507422402159245, + 0.06157778191676497, + 0.026246212851906908 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227639, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.78812850460614, + "eval_chrf_word_order": 2, + "eval_loss": 2.1401803493499756, + "eval_meteor": 0.2951305950097806, + "eval_runtime": 901.9929, + "eval_samples_per_second": 19.067, + "eval_scarebleu_bp": 0.9816841713663158, + "eval_scarebleu_counts": [ + 100428, + 36969, + 15127, + 6278 + ], + "eval_scarebleu_precisions": [ + 40.80166736411023, + 16.14775794742773, + 7.1431269773811215, + 3.2245472382302487 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.895786942120635, + "eval_scarebleu_sys_len": 246137, + "eval_scarebleu_totals": [ + 246137, + 228942, + 211770, + 194694 + ], + "eval_steps_per_second": 0.596, + "eval_ter_num_edits": 158622, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.63943142112662, + "step": 142500 + }, + { + "epoch": 56.01, + "learning_rate": 3.628711014607185e-05, + "loss": 1.9973, + "step": 143000 + }, + { + "epoch": 56.01, + "eval_bleu_bleu": 0.09294772573833016, + "eval_bleu_brevity_penalty": 0.9532328160601072, + "eval_bleu_length_ratio": 0.9542930766034774, + "eval_bleu_precisions": [ + 0.3828830017415167, + 0.14531882603131407, + 0.06163744871316673, + 0.026358853142720774 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227388, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.725559259661324, + "eval_chrf_word_order": 2, + "eval_loss": 2.1370763778686523, + "eval_meteor": 0.29485642596980205, + "eval_runtime": 890.3735, + "eval_samples_per_second": 19.315, + "eval_scarebleu_bp": 0.98118441145248, + "eval_scarebleu_counts": [ + 100641, + 37032, + 15129, + 6285 + ], + "eval_scarebleu_precisions": [ + 40.90864747534693, + 16.183970736695816, + 7.148223220740195, + 3.2301999280464613 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.910196394606393, + "eval_scarebleu_sys_len": 246014, + "eval_scarebleu_totals": [ + 246014, + 228819, + 211647, + 194570 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 158613, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.6353099569994, + "step": 143000 + }, + { + "epoch": 56.21, + "learning_rate": 3.623776154757205e-05, + "loss": 1.9803, + "step": 143500 + }, + { + "epoch": 56.21, + "eval_bleu_bleu": 0.09316282437784996, + "eval_bleu_brevity_penalty": 0.9557819790564587, + "eval_bleu_length_ratio": 0.9567313947095631, + "eval_bleu_precisions": [ + 0.3820958112725853, + 0.14527882945714368, + 0.061772711543129855, + 0.026324732108470583 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227969, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.86302914510016, + "eval_chrf_word_order": 2, + "eval_loss": 2.140497922897339, + "eval_meteor": 0.29564077830797303, + "eval_runtime": 880.9589, + "eval_samples_per_second": 19.522, + "eval_scarebleu_bp": 0.9826423742132848, + "eval_scarebleu_counts": [ + 100572, + 37085, + 15200, + 6310 + ], + "eval_scarebleu_precisions": [ + 40.82103152537007, + 16.18174519369224, + 7.169608407309227, + 3.237258744702901 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.934301216125077, + "eval_scarebleu_sys_len": 246373, + "eval_scarebleu_totals": [ + 246373, + 229178, + 212006, + 194918 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 158687, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.66919755093443, + "step": 143500 + }, + { + "epoch": 56.4, + "learning_rate": 3.618841294907225e-05, + "loss": 1.9697, + "step": 144000 + }, + { + "epoch": 56.4, + "eval_bleu_bleu": 0.09320593953744506, + "eval_bleu_brevity_penalty": 0.9545454662834784, + "eval_bleu_length_ratio": 0.9555479081245095, + "eval_bleu_precisions": [ + 0.3827095969466856, + 0.14563023772874978, + 0.061852150704487616, + 0.02637012331393436 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227687, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.77279638766784, + "eval_chrf_word_order": 2, + "eval_loss": 2.1364097595214844, + "eval_meteor": 0.294989686224605, + "eval_runtime": 894.7492, + "eval_samples_per_second": 19.221, + "eval_scarebleu_bp": 0.9810218350774949, + "eval_scarebleu_counts": [ + 100610, + 37072, + 15165, + 6300 + ], + "eval_scarebleu_precisions": [ + 40.90269703301975, + 16.20428448415283, + 7.16655324940456, + 3.238541730923447 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.925443673394422, + "eval_scarebleu_sys_len": 245974, + "eval_scarebleu_totals": [ + 245974, + 228779, + 211608, + 194532 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 158586, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.6229455646177, + "step": 144000 + }, + { + "epoch": 56.6, + "learning_rate": 3.6139064350572445e-05, + "loss": 1.9753, + "step": 144500 + }, + { + "epoch": 56.6, + "eval_bleu_bleu": 0.09292937117939612, + "eval_bleu_brevity_penalty": 0.9554138088004179, + "eval_bleu_length_ratio": 0.956378866790611, + "eval_bleu_precisions": [ + 0.38291682208131295, + 0.14517537614504722, + 0.061576380133517974, + 0.026147753219601465 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227885, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.82099450019943, + "eval_chrf_word_order": 2, + "eval_loss": 2.1318984031677246, + "eval_meteor": 0.2956912853215207, + "eval_runtime": 913.7886, + "eval_samples_per_second": 18.821, + "eval_scarebleu_bp": 0.9826667235498345, + "eval_scarebleu_counts": [ + 100812, + 36967, + 15096, + 6228 + ], + "eval_scarebleu_precisions": [ + 40.917448321488436, + 16.129834543423623, + 7.120250925642053, + 3.1948455670748284 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.877451501533006, + "eval_scarebleu_sys_len": 246379, + "eval_scarebleu_totals": [ + 246379, + 229184, + 212015, + 194939 + ], + "eval_steps_per_second": 0.589, + "eval_ter_num_edits": 158369, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.52357248510549, + "step": 144500 + }, + { + "epoch": 56.8, + "learning_rate": 3.608981444926964e-05, + "loss": 1.9833, + "step": 145000 + }, + { + "epoch": 56.8, + "eval_bleu_bleu": 0.09347586977549284, + "eval_bleu_brevity_penalty": 0.9564916560178641, + "eval_bleu_length_ratio": 0.957411269981828, + "eval_bleu_precisions": [ + 0.3834375862991001, + 0.1457740736526719, + 0.06185364846733409, + 0.026383537306423597 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228131, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.929848787717205, + "eval_chrf_word_order": 2, + "eval_loss": 2.132108211517334, + "eval_meteor": 0.2970114536623104, + "eval_runtime": 914.3186, + "eval_samples_per_second": 18.81, + "eval_scarebleu_bp": 0.9837942708488713, + "eval_scarebleu_counts": [ + 101007, + 37201, + 15220, + 6305 + ], + "eval_scarebleu_precisions": [ + 40.95038859630986, + 16.21227044129311, + 7.1693029477988075, + 3.2298053920589305 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.95451306803653, + "eval_scarebleu_sys_len": 246657, + "eval_scarebleu_totals": [ + 246657, + 229462, + 212294, + 195213 + ], + "eval_steps_per_second": 0.588, + "eval_ter_num_edits": 158264, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.47548873695442, + "step": 145000 + }, + { + "epoch": 56.99, + "learning_rate": 3.604046585076984e-05, + "loss": 1.9874, + "step": 145500 + }, + { + "epoch": 56.99, + "eval_bleu_bleu": 0.09270640083784529, + "eval_bleu_brevity_penalty": 0.9545981136015189, + "eval_bleu_length_ratio": 0.9555982692557884, + "eval_bleu_precisions": [ + 0.3828036135424398, + 0.1454699198115, + 0.06137247600132407, + 0.02602757595866442 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227699, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.79741707136206, + "eval_chrf_word_order": 2, + "eval_loss": 2.130342960357666, + "eval_meteor": 0.29557876359856, + "eval_runtime": 884.6222, + "eval_samples_per_second": 19.441, + "eval_scarebleu_bp": 0.9796226073034785, + "eval_scarebleu_counts": [ + 100546, + 36971, + 15060, + 6223 + ], + "eval_scarebleu_precisions": [ + 40.93392500916012, + 16.184472607087354, + 7.128555402507775, + 3.2046099418607645 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.86546858904399, + "eval_scarebleu_sys_len": 245630, + "eval_scarebleu_totals": [ + 245630, + 228435, + 211263, + 194189 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 158578, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.61928204094905, + "step": 145500 + }, + { + "epoch": 57.19, + "learning_rate": 3.5991117252270035e-05, + "loss": 1.9633, + "step": 146000 + }, + { + "epoch": 57.19, + "eval_bleu_bleu": 0.09348058733414458, + "eval_bleu_brevity_penalty": 0.9549972696708325, + "eval_bleu_length_ratio": 0.9559801745013199, + "eval_bleu_precisions": [ + 0.3841827999473199, + 0.14593888743797337, + 0.06194360867272558, + 0.0264345400741505 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227790, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.919649425568274, + "eval_chrf_word_order": 2, + "eval_loss": 2.130845785140991, + "eval_meteor": 0.2966280407940341, + "eval_runtime": 876.967, + "eval_samples_per_second": 19.611, + "eval_scarebleu_bp": 0.9825003248045555, + "eval_scarebleu_counts": [ + 101068, + 37219, + 15207, + 6312 + ], + "eval_scarebleu_precisions": [ + 41.028180792244804, + 16.242695609292014, + 7.1740945695401726, + 3.238700209858743 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.959790583452289, + "eval_scarebleu_sys_len": 246338, + "eval_scarebleu_totals": [ + 246338, + 229143, + 211971, + 194893 + ], + "eval_steps_per_second": 0.613, + "eval_ter_num_edits": 158117, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.40817148954292, + "step": 146000 + }, + { + "epoch": 57.38, + "learning_rate": 3.594176865377024e-05, + "loss": 1.9661, + "step": 146500 + }, + { + "epoch": 57.38, + "eval_bleu_bleu": 0.0936634539825762, + "eval_bleu_brevity_penalty": 0.9584648270817812, + "eval_bleu_length_ratio": 0.9593040091657259, + "eval_bleu_precisions": [ + 0.3839059943477614, + 0.14621996622308847, + 0.06193268701055981, + 0.02623158061075337 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228582, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.92280033231988, + "eval_chrf_word_order": 2, + "eval_loss": 2.128574848175049, + "eval_meteor": 0.29791782042237086, + "eval_runtime": 890.7768, + "eval_samples_per_second": 19.307, + "eval_scarebleu_bp": 0.9833523239359755, + "eval_scarebleu_counts": [ + 101101, + 37322, + 15231, + 6315 + ], + "eval_scarebleu_precisions": [ + 41.006619400684656, + 16.272732425562342, + 7.178305314801985, + 3.2366689218279108 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.97280881096937, + "eval_scarebleu_sys_len": 246548, + "eval_scarebleu_totals": [ + 246548, + 229353, + 212181, + 195108 + ], + "eval_steps_per_second": 0.604, + "eval_ter_num_edits": 158213, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.45213377356676, + "step": 146500 + }, + { + "epoch": 57.58, + "learning_rate": 3.5892420055270435e-05, + "loss": 1.9651, + "step": 147000 + }, + { + "epoch": 57.58, + "eval_bleu_bleu": 0.09371962746430165, + "eval_bleu_brevity_penalty": 0.9543567916669567, + "eval_bleu_length_ratio": 0.9553674474040935, + "eval_bleu_precisions": [ + 0.38417441267944685, + 0.14656757694263217, + 0.062201872833566145, + 0.026552739527837824 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227644, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.94982746336811, + "eval_chrf_word_order": 2, + "eval_loss": 2.1283161640167236, + "eval_meteor": 0.29704904407922184, + "eval_runtime": 888.41, + "eval_samples_per_second": 19.358, + "eval_scarebleu_bp": 0.9812047316761033, + "eval_scarebleu_counts": [ + 100987, + 37305, + 15263, + 6350 + ], + "eval_scarebleu_precisions": [ + 41.048455607087256, + 16.302922770338775, + 7.211365826923441, + 3.263590154750708 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.992044872348911, + "eval_scarebleu_sys_len": 246019, + "eval_scarebleu_totals": [ + 246019, + 228824, + 211652, + 194571 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 158242, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.46541404686563, + "step": 147000 + }, + { + "epoch": 57.78, + "learning_rate": 3.5843071456770624e-05, + "loss": 1.9719, + "step": 147500 + }, + { + "epoch": 57.78, + "eval_bleu_bleu": 0.09401468941552492, + "eval_bleu_brevity_penalty": 0.955326130123532, + "eval_bleu_length_ratio": 0.9562949315718129, + "eval_bleu_precisions": [ + 0.38428016588769665, + 0.14656097213651684, + 0.06233205175906404, + 0.02671766539169854 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227865, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.94781967177925, + "eval_chrf_word_order": 2, + "eval_loss": 2.1256425380706787, + "eval_meteor": 0.2970921550545355, + "eval_runtime": 882.9736, + "eval_samples_per_second": 19.477, + "eval_scarebleu_bp": 0.9791299806151322, + "eval_scarebleu_counts": [ + 100893, + 37169, + 15182, + 6278 + ], + "eval_scarebleu_precisions": [ + 41.09543845643133, + 16.279772593883862, + 7.190387557247932, + 3.2349985829490118 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.93597315125091, + "eval_scarebleu_sys_len": 245509, + "eval_scarebleu_totals": [ + 245509, + 228314, + 211143, + 194065 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 158088, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.39489121624406, + "step": 147500 + }, + { + "epoch": 57.97, + "learning_rate": 3.579372285827083e-05, + "loss": 1.9733, + "step": 148000 + }, + { + "epoch": 57.97, + "eval_bleu_bleu": 0.09327633826384595, + "eval_bleu_brevity_penalty": 0.9545191416323252, + "eval_bleu_length_ratio": 0.95552272755887, + "eval_bleu_precisions": [ + 0.3832950487743817, + 0.145829176287259, + 0.0618443649003745, + 0.026379685939911048 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227681, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.85552307288532, + "eval_chrf_word_order": 2, + "eval_loss": 2.1246635913848877, + "eval_meteor": 0.29663138120750626, + "eval_runtime": 885.5245, + "eval_samples_per_second": 19.421, + "eval_scarebleu_bp": 0.9838753411690799, + "eval_scarebleu_counts": [ + 100994, + 37275, + 15260, + 6321 + ], + "eval_scarebleu_precisions": [ + 40.941798384121746, + 16.243104034303343, + 7.187636887743808, + 3.237902048468643 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.973913184884568, + "eval_scarebleu_sys_len": 246677, + "eval_scarebleu_totals": [ + 246677, + 229482, + 212309, + 195219 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 158299, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.49151665300477, + "step": 148000 + }, + { + "epoch": 58.17, + "learning_rate": 3.5744374259771024e-05, + "loss": 1.9418, + "step": 148500 + }, + { + "epoch": 58.17, + "eval_bleu_bleu": 0.09341099267426081, + "eval_bleu_brevity_penalty": 0.954628823315288, + "eval_bleu_length_ratio": 0.9556276465823678, + "eval_bleu_precisions": [ + 0.38324857491677866, + 0.14585461092294463, + 0.06194433956897042, + 0.02647594307785674 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227706, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.92198395467786, + "eval_chrf_word_order": 2, + "eval_loss": 2.1282975673675537, + "eval_meteor": 0.29628102236356146, + "eval_runtime": 903.7977, + "eval_samples_per_second": 19.029, + "eval_scarebleu_bp": 0.9787226717038893, + "eval_scarebleu_counts": [ + 100554, + 37023, + 15125, + 6294 + ], + "eval_scarebleu_precisions": [ + 40.97404740657433, + 16.22293110852095, + 7.166819874716881, + 3.2449487788908193 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.913216724187732, + "eval_scarebleu_sys_len": 245409, + "eval_scarebleu_totals": [ + 245409, + 228214, + 211042, + 193963 + ], + "eval_steps_per_second": 0.595, + "eval_ter_num_edits": 158412, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.5432639248245, + "step": 148500 + }, + { + "epoch": 58.36, + "learning_rate": 3.569512435846822e-05, + "loss": 1.958, + "step": 149000 + }, + { + "epoch": 58.36, + "eval_bleu_bleu": 0.09349825180472493, + "eval_bleu_brevity_penalty": 0.9557162438669801, + "eval_bleu_length_ratio": 0.9566684432954645, + "eval_bleu_precisions": [ + 0.3844635321161287, + 0.14610526715347863, + 0.061942468711098715, + 0.026326223138529854 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227954, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.90882076472852, + "eval_chrf_word_order": 2, + "eval_loss": 2.126175880432129, + "eval_meteor": 0.2970561813889906, + "eval_runtime": 897.386, + "eval_samples_per_second": 19.165, + "eval_scarebleu_bp": 0.984458856632071, + "eval_scarebleu_counts": [ + 101340, + 37290, + 15261, + 6303 + ], + "eval_scarebleu_precisions": [ + 41.05809473262, + 16.23945023647148, + 7.183202010788218, + 3.2262027240759794 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.975960429463692, + "eval_scarebleu_sys_len": 246821, + "eval_scarebleu_totals": [ + 246821, + 229626, + 212454, + 195369 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 158200, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.4461805476052, + "step": 149000 + }, + { + "epoch": 58.56, + "learning_rate": 3.564577575996842e-05, + "loss": 1.9615, + "step": 149500 + }, + { + "epoch": 58.56, + "eval_bleu_bleu": 0.09341123662990738, + "eval_bleu_brevity_penalty": 0.9542207493549093, + "eval_bleu_length_ratio": 0.9552373478149564, + "eval_bleu_precisions": [ + 0.3832426091655573, + 0.14606164871826555, + 0.06211482238493182, + 0.026411667896260146 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227613, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 32.96275994224102, + "eval_chrf_word_order": 2, + "eval_loss": 2.1282684803009033, + "eval_meteor": 0.29568648260774466, + "eval_runtime": 884.5449, + "eval_samples_per_second": 19.443, + "eval_scarebleu_bp": 0.981034029205137, + "eval_scarebleu_counts": [ + 100821, + 37229, + 15263, + 6333 + ], + "eval_scarebleu_precisions": [ + 40.98797855084012, + 16.272696278553383, + 7.212865298098371, + 3.2556226706078912 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.974848863502727, + "eval_scarebleu_sys_len": 245977, + "eval_scarebleu_totals": [ + 245977, + 228782, + 211608, + 194525 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 158385, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.53089953244279, + "step": 149500 + }, + { + "epoch": 58.75, + "learning_rate": 3.5596427161468614e-05, + "loss": 1.9539, + "step": 150000 + }, + { + "epoch": 58.75, + "eval_bleu_bleu": 0.09381489714303094, + "eval_bleu_brevity_penalty": 0.9548876265640622, + "eval_bleu_length_ratio": 0.9558752554778223, + "eval_bleu_precisions": [ + 0.3847781704827344, + 0.14685852685567743, + 0.06236524670516884, + 0.026437837347484918 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227765, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.04137460269115, + "eval_chrf_word_order": 2, + "eval_loss": 2.120607852935791, + "eval_meteor": 0.2975228263789542, + "eval_runtime": 883.3247, + "eval_samples_per_second": 19.47, + "eval_scarebleu_bp": 0.9786656354954731, + "eval_scarebleu_counts": [ + 100922, + 37273, + 15230, + 6278 + ], + "eval_scarebleu_precisions": [ + 41.12634731759001, + 16.33347940403155, + 7.217051765642474, + 3.236833286071511 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 10.953529669120973, + "eval_scarebleu_sys_len": 245395, + "eval_scarebleu_totals": [ + 245395, + 228200, + 211028, + 193955 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 158093, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.39718091853698, + "step": 150000 + }, + { + "epoch": 58.95, + "learning_rate": 3.554707856296881e-05, + "loss": 1.9686, + "step": 150500 + }, + { + "epoch": 58.95, + "eval_bleu_bleu": 0.09428861917550069, + "eval_bleu_brevity_penalty": 0.9519800970327844, + "eval_bleu_length_ratio": 0.953096999735604, + "eval_bleu_precisions": [ + 0.38615958397731426, + 0.1474503115650666, + 0.06283885092893793, + 0.026895825626725094 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227103, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.02620077345346, + "eval_chrf_word_order": 2, + "eval_loss": 2.1201632022857666, + "eval_meteor": 0.2980247809530792, + "eval_runtime": 893.0328, + "eval_samples_per_second": 19.258, + "eval_scarebleu_bp": 0.9784537588447995, + "eval_scarebleu_counts": [ + 101118, + 37427, + 15357, + 6399 + ], + "eval_scarebleu_precisions": [ + 41.214952128244946, + 16.404702210845592, + 7.279026998331564, + 3.3001036600774616 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.045778286300349, + "eval_scarebleu_sys_len": 245343, + "eval_scarebleu_totals": [ + 245343, + 228148, + 210976, + 193903 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 157792, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.25934084050391, + "step": 150500 + }, + { + "epoch": 59.15, + "learning_rate": 3.549782866166601e-05, + "loss": 1.9437, + "step": 151000 + }, + { + "epoch": 59.15, + "eval_bleu_bleu": 0.09384711791636435, + "eval_bleu_brevity_penalty": 0.9577521155610426, + "eval_bleu_length_ratio": 0.9586199371325211, + "eval_bleu_precisions": [ + 0.3842893979922861, + 0.14666893913570428, + 0.06214508765239975, + 0.026318911315606625 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228419, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.106984318364304, + "eval_chrf_word_order": 2, + "eval_loss": 2.1196553707122803, + "eval_meteor": 0.2984543631131828, + "eval_runtime": 902.1587, + "eval_samples_per_second": 19.063, + "eval_scarebleu_bp": 0.9841833494212449, + "eval_scarebleu_counts": [ + 101329, + 37482, + 15325, + 6328 + ], + "eval_scarebleu_precisions": [ + 41.06495159126738, + 16.327899702907327, + 7.215669656519999, + 3.2400438286586177 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.012433653571566, + "eval_scarebleu_sys_len": 246753, + "eval_scarebleu_totals": [ + 246753, + 229558, + 212385, + 195306 + ], + "eval_steps_per_second": 0.596, + "eval_ter_num_edits": 158111, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.40542384679144, + "step": 151000 + }, + { + "epoch": 59.34, + "learning_rate": 3.5448480063166205e-05, + "loss": 1.9386, + "step": 151500 + }, + { + "epoch": 59.34, + "eval_bleu_bleu": 0.09434724582394613, + "eval_bleu_brevity_penalty": 0.9574240173044095, + "eval_bleu_length_ratio": 0.9583051800620281, + "eval_bleu_precisions": [ + 0.3847659671373016, + 0.1470667632809059, + 0.06254027331728415, + 0.02664579459850467 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228344, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.138400203344034, + "eval_chrf_word_order": 2, + "eval_loss": 2.119170904159546, + "eval_meteor": 0.29836275960818764, + "eval_runtime": 889.8786, + "eval_samples_per_second": 19.326, + "eval_scarebleu_bp": 0.9827235364028168, + "eval_scarebleu_counts": [ + 101382, + 37519, + 15426, + 6413 + ], + "eval_scarebleu_precisions": [ + 41.14646114134736, + 16.369689089782632, + 7.27559144247821, + 3.2896120484028994 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.073319589608897, + "eval_scarebleu_sys_len": 246393, + "eval_scarebleu_totals": [ + 246393, + 229198, + 212024, + 194947 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 157949, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.33123749250122, + "step": 151500 + }, + { + "epoch": 59.54, + "learning_rate": 3.539913146466641e-05, + "loss": 1.95, + "step": 152000 + }, + { + "epoch": 59.54, + "eval_bleu_bleu": 0.09420621625451771, + "eval_bleu_brevity_penalty": 0.9547516531684901, + "eval_bleu_length_ratio": 0.9557451558886851, + "eval_bleu_precisions": [ + 0.38476029051437205, + 0.14665691392093627, + 0.06263800476779001, + 0.026817967868343003 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227734, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.11107487846355, + "eval_chrf_word_order": 2, + "eval_loss": 2.1237027645111084, + "eval_meteor": 0.29777695963855666, + "eval_runtime": 893.7624, + "eval_samples_per_second": 19.242, + "eval_scarebleu_bp": 0.9822405260357506, + "eval_scarebleu_counts": [ + 101171, + 37361, + 15362, + 6390 + ], + "eval_scarebleu_precisions": [ + 41.08066624978682, + 16.30922083647999, + 7.249406579301297, + 3.2798328773732592 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.0350438869428, + "eval_scarebleu_sys_len": 246274, + "eval_scarebleu_totals": [ + 246274, + 229079, + 211907, + 194827 + ], + "eval_steps_per_second": 0.602, + "eval_ter_num_edits": 157966, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.3390224802971, + "step": 152000 + }, + { + "epoch": 59.73, + "learning_rate": 3.5349782866166604e-05, + "loss": 1.9508, + "step": 152500 + }, + { + "epoch": 59.73, + "eval_bleu_bleu": 0.09459288098333218, + "eval_bleu_brevity_penalty": 0.957743367611853, + "eval_bleu_length_ratio": 0.9586115436106413, + "eval_bleu_precisions": [ + 0.3844678811121764, + 0.14713429472308756, + 0.06270193392799171, + 0.026827628672628362 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228417, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.2063743407628, + "eval_chrf_word_order": 2, + "eval_loss": 2.1193974018096924, + "eval_meteor": 0.2989334775896594, + "eval_runtime": 885.4282, + "eval_samples_per_second": 19.423, + "eval_scarebleu_bp": 0.9827154204751549, + "eval_scarebleu_counts": [ + 101222, + 37538, + 15405, + 6405 + ], + "eval_scarebleu_precisions": [ + 41.081857697724345, + 16.378121782230057, + 7.265652635302441, + 3.2855589297439263 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.063111421455268, + "eval_scarebleu_sys_len": 246391, + "eval_scarebleu_totals": [ + 246391, + 229196, + 212025, + 194944 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 158023, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.36512508643627, + "step": 152500 + }, + { + "epoch": 59.93, + "learning_rate": 3.5300532964863795e-05, + "loss": 1.9448, + "step": 153000 + }, + { + "epoch": 59.93, + "eval_bleu_bleu": 0.09414559023031903, + "eval_bleu_brevity_penalty": 0.9570914392412777, + "eval_bleu_length_ratio": 0.9579862262305953, + "eval_bleu_precisions": [ + 0.38520072896770463, + 0.14701548753274934, + 0.06225504352489789, + 0.026555927450359583 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228268, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.12107686127237, + "eval_chrf_word_order": 2, + "eval_loss": 2.113703727722168, + "eval_meteor": 0.2987442836983213, + "eval_runtime": 892.8562, + "eval_samples_per_second": 19.262, + "eval_scarebleu_bp": 0.98382264619647, + "eval_scarebleu_counts": [ + 101485, + 37540, + 15344, + 6367 + ], + "eval_scarebleu_precisions": [ + 41.143012356890345, + 16.359508256017154, + 7.227678466285123, + 3.261498742425096 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.041737236762001, + "eval_scarebleu_sys_len": 246664, + "eval_scarebleu_totals": [ + 246664, + 229469, + 212295, + 195217 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 157887, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.30284518406917, + "step": 153000 + }, + { + "epoch": 60.13, + "learning_rate": 3.5251184366364e-05, + "loss": 1.9391, + "step": 153500 + }, + { + "epoch": 60.13, + "eval_bleu_bleu": 0.09551464548181195, + "eval_bleu_brevity_penalty": 0.9558038898686001, + "eval_bleu_length_ratio": 0.9567523785142626, + "eval_bleu_precisions": [ + 0.3860835007500855, + 0.1481456881378126, + 0.06345451634395385, + 0.027477163713381242 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227974, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.22391960090539, + "eval_chrf_word_order": 2, + "eval_loss": 2.1168127059936523, + "eval_meteor": 0.2993217929813263, + "eval_runtime": 906.1551, + "eval_samples_per_second": 18.979, + "eval_scarebleu_bp": 0.9812575623614842, + "eval_scarebleu_counts": [ + 101441, + 37699, + 15513, + 6501 + ], + "eval_scarebleu_precisions": [ + 41.23081550367432, + 16.474171571904893, + 7.328999461415626, + 3.3408705483323913 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.14334248623174, + "eval_scarebleu_sys_len": 246032, + "eval_scarebleu_totals": [ + 246032, + 228837, + 211666, + 194590 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 157733, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.23232235344761, + "step": 153500 + }, + { + "epoch": 60.32, + "learning_rate": 3.5201835767864194e-05, + "loss": 1.9275, + "step": 154000 + }, + { + "epoch": 60.32, + "eval_bleu_bleu": 0.09556023796566136, + "eval_bleu_brevity_penalty": 0.9588668789007414, + "eval_bleu_length_ratio": 0.9596901111721973, + "eval_bleu_precisions": [ + 0.38497161898598004, + 0.14782082381702202, + 0.06322046109510086, + 0.027419127393744535 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228674, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.223132584285864, + "eval_chrf_word_order": 2, + "eval_loss": 2.1147568225860596, + "eval_meteor": 0.29950834758228, + "eval_runtime": 887.3833, + "eval_samples_per_second": 19.381, + "eval_scarebleu_bp": 0.983972617018406, + "eval_scarebleu_counts": [ + 101421, + 37721, + 15499, + 6500 + ], + "eval_scarebleu_precisions": [ + 41.11089942886328, + 16.435735884900613, + 7.299280385803632, + 3.328877758487358 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.138174538597962, + "eval_scarebleu_sys_len": 246701, + "eval_scarebleu_totals": [ + 246701, + 229506, + 212336, + 195261 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 157841, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.28177992297441, + "step": 154000 + }, + { + "epoch": 60.52, + "learning_rate": 3.515248716936439e-05, + "loss": 1.9312, + "step": 154500 + }, + { + "epoch": 60.52, + "eval_bleu_bleu": 0.09469366607691887, + "eval_bleu_brevity_penalty": 0.9570214093150639, + "eval_bleu_length_ratio": 0.9579190780555568, + "eval_bleu_precisions": [ + 0.384675709303752, + 0.14763784191000534, + 0.06286392119446092, + 0.026847459160536272 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228252, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.26743698873064, + "eval_chrf_word_order": 2, + "eval_loss": 2.1209371089935303, + "eval_meteor": 0.29874336240130306, + "eval_runtime": 901.3452, + "eval_samples_per_second": 19.08, + "eval_scarebleu_bp": 0.9843413700470165, + "eval_scarebleu_counts": [ + 101396, + 37702, + 15456, + 6405 + ], + "eval_scarebleu_precisions": [ + 41.0856105546371, + 16.42094626671951, + 7.276014009716416, + 3.2788647602666092 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.08720243338128, + "eval_scarebleu_sys_len": 246792, + "eval_scarebleu_totals": [ + 246792, + 229597, + 212424, + 195342 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 157958, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.33535895662845, + "step": 154500 + }, + { + "epoch": 60.71, + "learning_rate": 3.5103138570864594e-05, + "loss": 1.938, + "step": 155000 + }, + { + "epoch": 60.71, + "eval_bleu_bleu": 0.09523275442733467, + "eval_bleu_brevity_penalty": 0.9584954234278611, + "eval_bleu_length_ratio": 0.9593333864923053, + "eval_bleu_precisions": [ + 0.38607719531561013, + 0.14788499200544955, + 0.06294051927859096, + 0.02711793621500206 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228589, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.200568846589114, + "eval_chrf_word_order": 2, + "eval_loss": 2.11315655708313, + "eval_meteor": 0.2996999609557199, + "eval_runtime": 908.3945, + "eval_samples_per_second": 18.932, + "eval_scarebleu_bp": 0.9870562894952948, + "eval_scarebleu_counts": [ + 101955, + 37844, + 15509, + 6477 + ], + "eval_scarebleu_precisions": [ + 41.20009860059888, + 16.434762971841508, + 7.278008766084451, + 3.304406385355924 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.15023067198716, + "eval_scarebleu_sys_len": 247463, + "eval_scarebleu_totals": [ + 247463, + 230268, + 213094, + 196011 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 157648, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.19339741446818, + "step": 155000 + }, + { + "epoch": 60.91, + "learning_rate": 3.505378997236478e-05, + "loss": 1.9463, + "step": 155500 + }, + { + "epoch": 60.91, + "eval_bleu_bleu": 0.09465177838309735, + "eval_bleu_brevity_penalty": 0.9548218351897959, + "eval_bleu_length_ratio": 0.9558123040637236, + "eval_bleu_precisions": [ + 0.3857826564215148, + 0.14733917503740115, + 0.06279441344826338, + 0.027054767332403345 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227750, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.20241337094825, + "eval_chrf_word_order": 2, + "eval_loss": 2.1102170944213867, + "eval_meteor": 0.29830965830953154, + "eval_runtime": 885.1854, + "eval_samples_per_second": 19.429, + "eval_scarebleu_bp": 0.9811681549818749, + "eval_scarebleu_counts": [ + 101459, + 37567, + 15355, + 6400 + ], + "eval_scarebleu_precisions": [ + 41.24181943823422, + 16.418066997355943, + 7.255141913505289, + 3.289524406729133 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.062496859926739, + "eval_scarebleu_sys_len": 246010, + "eval_scarebleu_totals": [ + 246010, + 228815, + 211643, + 194557 + ], + "eval_steps_per_second": 0.608, + "eval_ter_num_edits": 157832, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.27765845884718, + "step": 155500 + }, + { + "epoch": 61.1, + "learning_rate": 3.500444137386498e-05, + "loss": 1.9281, + "step": 156000 + }, + { + "epoch": 61.1, + "eval_bleu_bleu": 0.09533901987756373, + "eval_bleu_brevity_penalty": 0.9581019734375871, + "eval_bleu_length_ratio": 0.9589556780077136, + "eval_bleu_precisions": [ + 0.3854327590055099, + 0.14783913224548517, + 0.06322143986649016, + 0.02721656935707913 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228499, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.29601532019415, + "eval_chrf_word_order": 2, + "eval_loss": 2.11220383644104, + "eval_meteor": 0.2994521714865379, + "eval_runtime": 876.5143, + "eval_samples_per_second": 19.621, + "eval_scarebleu_bp": 0.9851068142470663, + "eval_scarebleu_counts": [ + 101706, + 37865, + 15572, + 6510 + ], + "eval_scarebleu_precisions": [ + 41.17968588676862, + 16.478375532016745, + 7.324070851402071, + 3.329395338846526 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.172803367906523, + "eval_scarebleu_sys_len": 246981, + "eval_scarebleu_totals": [ + 246981, + 229786, + 212614, + 195531 + ], + "eval_steps_per_second": 0.614, + "eval_ter_num_edits": 157756, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.24285498399499, + "step": 156000 + }, + { + "epoch": 61.3, + "learning_rate": 3.495509277536518e-05, + "loss": 1.9181, + "step": 156500 + }, + { + "epoch": 61.3, + "eval_bleu_bleu": 0.09517728212181895, + "eval_bleu_brevity_penalty": 0.960490987500557, + "eval_bleu_length_ratio": 0.9612513062418425, + "eval_bleu_precisions": [ + 0.3855950333120858, + 0.1476887057412993, + 0.06285858103353519, + 0.02693498452012384 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229046, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.32810912464366, + "eval_chrf_word_order": 2, + "eval_loss": 2.110365390777588, + "eval_meteor": 0.30051316093268554, + "eval_runtime": 909.2517, + "eval_samples_per_second": 18.914, + "eval_scarebleu_bp": 0.9876258635383938, + "eval_scarebleu_counts": [ + 101938, + 37918, + 15525, + 6475 + ], + "eval_scarebleu_precisions": [ + 41.16977108608908, + 16.456822433151483, + 7.2806655536588565, + 3.300910490522946 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.156417821920163, + "eval_scarebleu_sys_len": 247604, + "eval_scarebleu_totals": [ + 247604, + 230409, + 213236, + 196158 + ], + "eval_steps_per_second": 0.592, + "eval_ter_num_edits": 157618, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.17965920071072, + "step": 156500 + }, + { + "epoch": 61.5, + "learning_rate": 3.490584287406238e-05, + "loss": 1.9173, + "step": 157000 + }, + { + "epoch": 61.5, + "eval_bleu_bleu": 0.095173428640039, + "eval_bleu_brevity_penalty": 0.9545937264260639, + "eval_bleu_length_ratio": 0.9555940724948485, + "eval_bleu_precisions": [ + 0.386964312378677, + 0.14820691391571617, + 0.06330331697174393, + 0.027215900711311785 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227698, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.21382459956928, + "eval_chrf_word_order": 2, + "eval_loss": 2.1118085384368896, + "eval_meteor": 0.29979450180419676, + "eval_runtime": 889.3591, + "eval_samples_per_second": 19.338, + "eval_scarebleu_bp": 0.9830034962717886, + "eval_scarebleu_counts": [ + 101738, + 37786, + 15541, + 6474 + ], + "eval_scarebleu_precisions": [ + 41.279385868815474, + 16.48122058560543, + 7.327445978886621, + 3.319829752320394 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.149434022514816, + "eval_scarebleu_sys_len": 246462, + "eval_scarebleu_totals": [ + 246462, + 229267, + 212093, + 195010 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 157467, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.11051019146491, + "step": 157000 + }, + { + "epoch": 61.69, + "learning_rate": 3.485649427556257e-05, + "loss": 1.9291, + "step": 157500 + }, + { + "epoch": 61.69, + "eval_bleu_bleu": 0.09543498464686379, + "eval_bleu_brevity_penalty": 0.9592032596922077, + "eval_bleu_length_ratio": 0.9600132617645701, + "eval_bleu_precisions": [ + 0.3851830155933745, + 0.14802227306245155, + 0.06327805098870347, + 0.02716067481618476 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228751, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.364871378123624, + "eval_chrf_word_order": 2, + "eval_loss": 2.108616590499878, + "eval_meteor": 0.29999226140773805, + "eval_runtime": 881.5501, + "eval_samples_per_second": 19.509, + "eval_scarebleu_bp": 0.9837415716731688, + "eval_scarebleu_counts": [ + 101527, + 37851, + 15552, + 6488 + ], + "eval_scarebleu_precisions": [ + 41.163377175199884, + 16.496476341147705, + 7.3262765160615615, + 3.323821575126667 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.155443050769385, + "eval_scarebleu_sys_len": 246644, + "eval_scarebleu_totals": [ + 246644, + 229449, + 212277, + 195197 + ], + "eval_steps_per_second": 0.61, + "eval_ter_num_edits": 157728, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.2300326511547, + "step": 157500 + }, + { + "epoch": 61.89, + "learning_rate": 3.480714567706277e-05, + "loss": 1.9373, + "step": 158000 + }, + { + "epoch": 61.89, + "eval_bleu_bleu": 0.09533418698357059, + "eval_bleu_brevity_penalty": 0.9545323040405811, + "eval_bleu_length_ratio": 0.9555353178416898, + "eval_bleu_precisions": [ + 0.3865445090564115, + 0.148368798369511, + 0.06349378769539535, + 0.027324915194626914 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227684, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.3171864210862, + "eval_chrf_word_order": 2, + "eval_loss": 2.105787515640259, + "eval_meteor": 0.29977298864592217, + "eval_runtime": 910.6653, + "eval_samples_per_second": 18.885, + "eval_scarebleu_bp": 0.98231766071564, + "eval_scarebleu_counts": [ + 101672, + 37783, + 15532, + 6520 + ], + "eval_scarebleu_precisions": [ + 41.2809133836528, + 16.492068896280195, + 7.32900790373953, + 3.346198062079159 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.166248022211402, + "eval_scarebleu_sys_len": 246293, + "eval_scarebleu_totals": [ + 246293, + 229098, + 211925, + 194848 + ], + "eval_steps_per_second": 0.591, + "eval_ter_num_edits": 157609, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.1755377365835, + "step": 158000 + }, + { + "epoch": 62.08, + "learning_rate": 3.475779707856297e-05, + "loss": 1.9196, + "step": 158500 + }, + { + "epoch": 62.08, + "eval_bleu_bleu": 0.09550871517407127, + "eval_bleu_brevity_penalty": 0.9552515974737722, + "eval_bleu_length_ratio": 0.9562235866358345, + "eval_bleu_precisions": [ + 0.38692900530178015, + 0.14858084147864023, + 0.06360502555674424, + 0.027328474434104487 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227848, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.34547224837362, + "eval_chrf_word_order": 2, + "eval_loss": 2.107067823410034, + "eval_meteor": 0.29983566586560506, + "eval_runtime": 885.7877, + "eval_samples_per_second": 19.415, + "eval_scarebleu_bp": 0.9823257798156602, + "eval_scarebleu_counts": [ + 101781, + 37875, + 15645, + 6527 + ], + "eval_scarebleu_precisions": [ + 41.324834040479914, + 16.532082060235705, + 7.382258985405352, + 3.3498937600722636 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.199413686817575, + "eval_scarebleu_sys_len": 246295, + "eval_scarebleu_totals": [ + 246295, + 229100, + 211927, + 194842 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 157565, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.15538835640591, + "step": 158500 + }, + { + "epoch": 62.28, + "learning_rate": 3.470854717726017e-05, + "loss": 1.9089, + "step": 159000 + }, + { + "epoch": 62.28, + "eval_bleu_bleu": 0.09571905714008087, + "eval_bleu_brevity_penalty": 0.9566799462076363, + "eval_bleu_length_ratio": 0.957591730702244, + "eval_bleu_precisions": [ + 0.3867005004952361, + 0.14870200351693771, + 0.0637443827036286, + 0.02733968412001629 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228174, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.34094186642432, + "eval_chrf_word_order": 2, + "eval_loss": 2.1063573360443115, + "eval_meteor": 0.30037090266748917, + "eval_runtime": 878.927, + "eval_samples_per_second": 19.567, + "eval_scarebleu_bp": 0.9830967991106747, + "eval_scarebleu_counts": [ + 101792, + 37942, + 15641, + 6512 + ], + "eval_scarebleu_precisions": [ + 41.297442035012274, + 16.5476034715862, + 7.373656420893834, + 3.338750942099947 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.196378633129696, + "eval_scarebleu_sys_len": 246485, + "eval_scarebleu_totals": [ + 246485, + 229290, + 212120, + 195043 + ], + "eval_steps_per_second": 0.612, + "eval_ter_num_edits": 157560, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.153098654113, + "step": 159000 + }, + { + "epoch": 62.48, + "learning_rate": 3.4659198578760364e-05, + "loss": 1.9108, + "step": 159500 + }, + { + "epoch": 62.48, + "eval_bleu_bleu": 0.09570189976895206, + "eval_bleu_brevity_penalty": 0.9589236780767392, + "eval_bleu_length_ratio": 0.9597446690644161, + "eval_bleu_precisions": [ + 0.38657641230153006, + 0.14814271934635825, + 0.0634803013461776, + 0.027289238856988144 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228687, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.34466398123215, + "eval_chrf_word_order": 2, + "eval_loss": 2.105936050415039, + "eval_meteor": 0.30083027619995945, + "eval_runtime": 895.3842, + "eval_samples_per_second": 19.207, + "eval_scarebleu_bp": 0.9844223967321762, + "eval_scarebleu_counts": [ + 101933, + 37891, + 15629, + 6513 + ], + "eval_scarebleu_precisions": [ + 41.29985576065994, + 16.501826955321253, + 7.356866141658155, + 3.3338281437953325 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.19336439817067, + "eval_scarebleu_sys_len": 246812, + "eval_scarebleu_totals": [ + 246812, + 229617, + 212441, + 195361 + ], + "eval_steps_per_second": 0.601, + "eval_ter_num_edits": 157537, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.1425660235656, + "step": 159500 + }, + { + "epoch": 62.67, + "learning_rate": 3.460984998026056e-05, + "loss": 1.9178, + "step": 160000 + }, + { + "epoch": 62.67, + "eval_bleu_bleu": 0.09536566651371585, + "eval_bleu_brevity_penalty": 0.9542997438152334, + "eval_bleu_length_ratio": 0.9553128895118748, + "eval_bleu_precisions": [ + 0.3858349697536803, + 0.14863426409929859, + 0.06370197904540163, + 0.02729955172218124 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227631, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.362786383325535, + "eval_chrf_word_order": 2, + "eval_loss": 2.106112480163574, + "eval_meteor": 0.29962838164737177, + "eval_runtime": 896.037, + "eval_samples_per_second": 19.193, + "eval_scarebleu_bp": 0.9822608252023466, + "eval_scarebleu_counts": [ + 101453, + 37825, + 15583, + 6495 + ], + "eval_scarebleu_precisions": [ + 41.194336504533474, + 16.51141066159138, + 7.353558805347528, + 3.3336926227614985 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.161897434420977, + "eval_scarebleu_sys_len": 246279, + "eval_scarebleu_totals": [ + 246279, + 229084, + 211911, + 194829 + ], + "eval_steps_per_second": 0.6, + "eval_ter_num_edits": 157749, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.23964940078491, + "step": 160000 + }, + { + "epoch": 62.87, + "learning_rate": 3.4560501381760756e-05, + "loss": 1.9172, + "step": 160500 + }, + { + "epoch": 62.87, + "eval_bleu_bleu": 0.09629964291643578, + "eval_bleu_brevity_penalty": 0.9619121857228051, + "eval_bleu_length_ratio": 0.9626194503082521, + "eval_bleu_precisions": [ + 0.38600613849990406, + 0.14860234615438997, + 0.06373421259095548, + 0.02747669537953239 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229372, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.42457085936596, + "eval_chrf_word_order": 2, + "eval_loss": 2.102973222732544, + "eval_meteor": 0.30115313744659666, + "eval_runtime": 880.6956, + "eval_samples_per_second": 19.528, + "eval_scarebleu_bp": 0.9872623426147552, + "eval_scarebleu_counts": [ + 101986, + 38084, + 15760, + 6602 + ], + "eval_scarebleu_precisions": [ + 41.204133907576946, + 16.535327089818903, + 7.394062230229329, + 3.3673365296337856 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.267131751225088, + "eval_scarebleu_sys_len": 247514, + "eval_scarebleu_totals": [ + 247514, + 230319, + 213144, + 196060 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 157508, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.12928575026675, + "step": 160500 + }, + { + "epoch": 63.06, + "learning_rate": 3.4511251480457954e-05, + "loss": 1.9191, + "step": 161000 + }, + { + "epoch": 63.06, + "eval_bleu_bleu": 0.09558986400244632, + "eval_bleu_brevity_penalty": 0.9543567916669567, + "eval_bleu_length_ratio": 0.9553674474040935, + "eval_bleu_precisions": [ + 0.38758324401258104, + 0.14914302277511415, + 0.06378597629431881, + 0.027296763651218737 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227644, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.34839203271826, + "eval_chrf_word_order": 2, + "eval_loss": 2.103398084640503, + "eval_meteor": 0.30030452123699736, + "eval_runtime": 898.052, + "eval_samples_per_second": 19.15, + "eval_scarebleu_bp": 0.9805217502258585, + "eval_scarebleu_counts": [ + 101753, + 37872, + 15608, + 6486 + ], + "eval_scarebleu_precisions": [ + 41.388076517890916, + 16.56287173745714, + 7.380227345803938, + 3.3362824575120364 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.176172345763703, + "eval_scarebleu_sys_len": 245851, + "eval_scarebleu_totals": [ + 245851, + 228656, + 211484, + 194408 + ], + "eval_steps_per_second": 0.599, + "eval_ter_num_edits": 157317, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.04181912267768, + "step": 161000 + }, + { + "epoch": 63.26, + "learning_rate": 3.446190288195815e-05, + "loss": 1.8911, + "step": 161500 + }, + { + "epoch": 63.26, + "eval_bleu_bleu": 0.09558201957239434, + "eval_bleu_brevity_penalty": 0.9593866943923496, + "eval_bleu_length_ratio": 0.9601895257240461, + "eval_bleu_precisions": [ + 0.38586407800937966, + 0.14847021238385996, + 0.06347557306479734, + 0.027092540813565436 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228793, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.433523400035455, + "eval_chrf_word_order": 2, + "eval_loss": 2.1054422855377197, + "eval_meteor": 0.3010338068155898, + "eval_runtime": 892.3912, + "eval_samples_per_second": 19.272, + "eval_scarebleu_bp": 0.9836037301421974, + "eval_scarebleu_counts": [ + 101725, + 37964, + 15637, + 6515 + ], + "eval_scarebleu_precisions": [ + 41.24934106483922, + 16.54817688468496, + 7.367533287473733, + 3.3383207452423167 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.196299350846525, + "eval_scarebleu_sys_len": 246610, + "eval_scarebleu_totals": [ + 246610, + 229415, + 212242, + 195158 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 157696, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.21537855648008, + "step": 161500 + }, + { + "epoch": 63.45, + "learning_rate": 3.441255428345835e-05, + "loss": 1.9026, + "step": 162000 + }, + { + "epoch": 63.45, + "eval_bleu_bleu": 0.09604705248151887, + "eval_bleu_brevity_penalty": 0.9577040009335345, + "eval_bleu_length_ratio": 0.9585737727621821, + "eval_bleu_precisions": [ + 0.38702234597737384, + 0.14947470089435783, + 0.06390072712843531, + 0.02736537635866495 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228408, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.46293426916391, + "eval_chrf_word_order": 2, + "eval_loss": 2.103778839111328, + "eval_meteor": 0.3020132372147158, + "eval_runtime": 882.7551, + "eval_samples_per_second": 19.482, + "eval_scarebleu_bp": 0.9836848156591972, + "eval_scarebleu_counts": [ + 101909, + 38115, + 15688, + 6533 + ], + "eval_scarebleu_precisions": [ + 41.32060171106516, + 16.612548216270405, + 7.390900824927801, + 3.3471495688617234 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.229225779172172, + "eval_scarebleu_sys_len": 246630, + "eval_scarebleu_totals": [ + 246630, + 229435, + 212261, + 195181 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 157303, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.03540795625753, + "step": 162000 + }, + { + "epoch": 63.65, + "learning_rate": 3.436320568495855e-05, + "loss": 1.9121, + "step": 162500 + }, + { + "epoch": 63.65, + "eval_bleu_bleu": 0.09658095155447538, + "eval_bleu_brevity_penalty": 0.9595002330325494, + "eval_bleu_length_ratio": 0.9602986415084838, + "eval_bleu_precisions": [ + 0.3867511002145801, + 0.14911824745775526, + 0.06423943227398951, + 0.02770904376743793 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228819, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.51096468550019, + "eval_chrf_word_order": 2, + "eval_loss": 2.103503704071045, + "eval_meteor": 0.3018293977057512, + "eval_runtime": 885.8305, + "eval_samples_per_second": 19.415, + "eval_scarebleu_bp": 0.9838307532931503, + "eval_scarebleu_counts": [ + 101964, + 38096, + 15793, + 6613 + ], + "eval_scarebleu_precisions": [ + 41.336868478022915, + 16.60166208366199, + 7.439141575912877, + 3.3875991230047333 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.282267397077854, + "eval_scarebleu_sys_len": 246666, + "eval_scarebleu_totals": [ + 246666, + 229471, + 212296, + 195212 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 157407, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.08303376395001, + "step": 162500 + }, + { + "epoch": 63.85, + "learning_rate": 3.4313857086458746e-05, + "loss": 1.9129, + "step": 163000 + }, + { + "epoch": 63.85, + "eval_bleu_bleu": 0.09614070503004692, + "eval_bleu_brevity_penalty": 0.9588319240240978, + "eval_bleu_length_ratio": 0.959656537084678, + "eval_bleu_precisions": [ + 0.3875434039166295, + 0.14921667746404946, + 0.06375412358665837, + 0.02741657969706372 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228666, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.45836864957393, + "eval_chrf_word_order": 2, + "eval_loss": 2.0966038703918457, + "eval_meteor": 0.30169168222046183, + "eval_runtime": 889.1898, + "eval_samples_per_second": 19.341, + "eval_scarebleu_bp": 0.983473979862278, + "eval_scarebleu_counts": [ + 102119, + 38087, + 15682, + 6560 + ], + "eval_scarebleu_precisions": [ + 41.41448142170023, + 16.60410754066343, + 7.389884500657371, + 3.3618613232204173 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.243698119743538, + "eval_scarebleu_sys_len": 246578, + "eval_scarebleu_totals": [ + 246578, + 229383, + 212209, + 195130 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 157283, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.02624914708589, + "step": 163000 + }, + { + "epoch": 64.04, + "learning_rate": 3.4264607185155944e-05, + "loss": 1.9055, + "step": 163500 + }, + { + "epoch": 64.04, + "eval_bleu_bleu": 0.09623543609366864, + "eval_bleu_brevity_penalty": 0.9554444946023479, + "eval_bleu_length_ratio": 0.9564082441171904, + "eval_bleu_precisions": [ + 0.38783722113983815, + 0.15000213576842575, + 0.06416993484315336, + 0.027570186124252813 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 227892, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.51573940240088, + "eval_chrf_word_order": 2, + "eval_loss": 2.100843906402588, + "eval_meteor": 0.3018152678522298, + "eval_runtime": 901.0792, + "eval_samples_per_second": 19.086, + "eval_scarebleu_bp": 0.9846532873315705, + "eval_scarebleu_counts": [ + 102170, + 38295, + 15827, + 6608 + ], + "eval_scarebleu_precisions": [ + 41.38632230049135, + 16.673633062514696, + 7.448, + 3.381348343354228 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.30544077935444, + "eval_scarebleu_sys_len": 246869, + "eval_scarebleu_totals": [ + 246869, + 229674, + 212500, + 195425 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 157244, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.00838946920122, + "step": 163500 + }, + { + "epoch": 64.24, + "learning_rate": 3.421525858665614e-05, + "loss": 1.8885, + "step": 164000 + }, + { + "epoch": 64.24, + "eval_bleu_bleu": 0.09587248945303208, + "eval_bleu_brevity_penalty": 0.9590853203396551, + "eval_bleu_length_ratio": 0.9598999492191926, + "eval_bleu_precisions": [ + 0.3868986201710358, + 0.14881647433685216, + 0.06353795814211924, + 0.027293900038910725 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228724, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.48293590765525, + "eval_chrf_word_order": 2, + "eval_loss": 2.097367286682129, + "eval_meteor": 0.3013271630222525, + "eval_runtime": 880.0984, + "eval_samples_per_second": 19.541, + "eval_scarebleu_bp": 0.9839280334098534, + "eval_scarebleu_counts": [ + 102006, + 38026, + 15641, + 6510 + ], + "eval_scarebleu_precisions": [ + 41.34987230937614, + 16.56942417046123, + 7.366571843032347, + 3.334289401979062 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.206652663172745, + "eval_scarebleu_sys_len": 246690, + "eval_scarebleu_totals": [ + 246690, + 229495, + 212324, + 195244 + ], + "eval_steps_per_second": 0.611, + "eval_ter_num_edits": 157450, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.10272520366901, + "step": 164000 + }, + { + "epoch": 64.43, + "learning_rate": 3.4165909988156336e-05, + "loss": 1.8894, + "step": 164500 + }, + { + "epoch": 64.43, + "eval_bleu_bleu": 0.09625296283008743, + "eval_bleu_brevity_penalty": 0.9608224833426404, + "eval_bleu_length_ratio": 0.9615702600732754, + "eval_bleu_precisions": [ + 0.387431150216915, + 0.14918816384887248, + 0.06387250145048085, + 0.027279786623451163 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229122, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.6094403137105, + "eval_chrf_word_order": 2, + "eval_loss": 2.096004009246826, + "eval_meteor": 0.30269295192080786, + "eval_runtime": 907.0625, + "eval_samples_per_second": 18.96, + "eval_scarebleu_bp": 0.9893165385676739, + "eval_scarebleu_counts": [ + 102562, + 38329, + 15826, + 6594 + ], + "eval_scarebleu_precisions": [ + 41.351810114384556, + 16.605004592163862, + 7.407303397081262, + 3.354547258214673 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.30686384504715, + "eval_scarebleu_sys_len": 248023, + "eval_scarebleu_totals": [ + 248023, + 230828, + 213654, + 196569 + ], + "eval_steps_per_second": 0.593, + "eval_ter_num_edits": 157183, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.98045510122773, + "step": 164500 + }, + { + "epoch": 64.63, + "learning_rate": 3.411656138965654e-05, + "loss": 1.9013, + "step": 165000 + }, + { + "epoch": 64.63, + "eval_bleu_bleu": 0.0960240418372507, + "eval_bleu_brevity_penalty": 0.9584342298384669, + "eval_bleu_length_ratio": 0.9592746318391465, + "eval_bleu_precisions": [ + 0.38697582850267964, + 0.14919576118838113, + 0.06387119694777545, + 0.027322805314429557 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228575, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.54224618446445, + "eval_chrf_word_order": 2, + "eval_loss": 2.097243547439575, + "eval_meteor": 0.30148053963011523, + "eval_runtime": 883.5302, + "eval_samples_per_second": 19.465, + "eval_scarebleu_bp": 0.982252705584277, + "eval_scarebleu_counts": [ + 101811, + 38065, + 15684, + 6544 + ], + "eval_scarebleu_precisions": [ + 41.34003581333214, + 16.616320793427683, + 7.401185397712258, + 3.3587566851781516 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.22844509389964, + "eval_scarebleu_sys_len": 246277, + "eval_scarebleu_totals": [ + 246277, + 229082, + 211912, + 194834 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 157511, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.1306595716425, + "step": 165000 + }, + { + "epoch": 64.83, + "learning_rate": 3.406731148835373e-05, + "loss": 1.8934, + "step": 165500 + }, + { + "epoch": 64.83, + "eval_bleu_bleu": 0.09669588952078617, + "eval_bleu_brevity_penalty": 0.9587008328025101, + "eval_bleu_length_ratio": 0.9595306342564809, + "eval_bleu_precisions": [ + 0.38743679910425305, + 0.14961147554164045, + 0.06423718344657196, + 0.027793764176173873 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228636, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.58061135324882, + "eval_chrf_word_order": 2, + "eval_loss": 2.096670150756836, + "eval_meteor": 0.3025152153653177, + "eval_runtime": 900.4306, + "eval_samples_per_second": 19.1, + "eval_scarebleu_bp": 0.9852727868471164, + "eval_scarebleu_counts": [ + 102180, + 38281, + 15827, + 6654 + ], + "eval_scarebleu_precisions": [ + 41.364736744095666, + 16.65644158432212, + 7.442606299434763, + 3.4023449284403107 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.323624438672423, + "eval_scarebleu_sys_len": 247022, + "eval_scarebleu_totals": [ + 247022, + 229827, + 212654, + 195571 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 157223, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.99877271957101, + "step": 165500 + }, + { + "epoch": 65.02, + "learning_rate": 3.401796288985393e-05, + "loss": 1.9043, + "step": 166000 + }, + { + "epoch": 65.02, + "eval_bleu_bleu": 0.09687927778969782, + "eval_bleu_brevity_penalty": 0.9602422963358532, + "eval_bleu_length_ratio": 0.9610120908682679, + "eval_bleu_precisions": [ + 0.3876561756241566, + 0.14954153564312492, + 0.06426486908627564, + 0.027811094030665968 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228989, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.56731621680797, + "eval_chrf_word_order": 2, + "eval_loss": 2.0984363555908203, + "eval_meteor": 0.30217875578779124, + "eval_runtime": 881.3546, + "eval_samples_per_second": 19.513, + "eval_scarebleu_bp": 0.9865672506541593, + "eval_scarebleu_counts": [ + 102357, + 38298, + 15816, + 6675 + ], + "eval_scarebleu_precisions": [ + 41.38278173541089, + 16.640668789947295, + 7.426328343632027, + 3.407524631170555 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.33515848822203, + "eval_scarebleu_sys_len": 247342, + "eval_scarebleu_totals": [ + 247342, + 230147, + 212972, + 195890 + ], + "eval_steps_per_second": 0.61, + "eval_ter_num_edits": 157164, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.97175423251468, + "step": 166000 + }, + { + "epoch": 65.22, + "learning_rate": 3.396861429135413e-05, + "loss": 1.8833, + "step": 166500 + }, + { + "epoch": 65.22, + "eval_bleu_bleu": 0.09668703899640418, + "eval_bleu_brevity_penalty": 0.9592818785160087, + "eval_bleu_length_ratio": 0.9600888034614884, + "eval_bleu_precisions": [ + 0.38683125773159827, + 0.14959305018575061, + 0.06430739159508256, + 0.0277328311843537 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228769, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.57447197101524, + "eval_chrf_word_order": 2, + "eval_loss": 2.096048593521118, + "eval_meteor": 0.3017103429626479, + "eval_runtime": 881.3746, + "eval_samples_per_second": 19.513, + "eval_scarebleu_bp": 0.9850703776046533, + "eval_scarebleu_counts": [ + 102102, + 38299, + 15839, + 6678 + ], + "eval_scarebleu_precisions": [ + 41.341528594334584, + 16.667899746275737, + 7.450106067233927, + 3.41550736497545 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.33544391463128, + "eval_scarebleu_sys_len": 246972, + "eval_scarebleu_totals": [ + 246972, + 229777, + 212601, + 195520 + ], + "eval_steps_per_second": 0.61, + "eval_ter_num_edits": 157333, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.04914617001498, + "step": 166500 + }, + { + "epoch": 65.41, + "learning_rate": 3.3919265692854326e-05, + "loss": 1.8834, + "step": 167000 + }, + { + "epoch": 65.41, + "eval_bleu_bleu": 0.09735762733372984, + "eval_bleu_brevity_penalty": 0.9601899327326467, + "eval_bleu_length_ratio": 0.960961729736989, + "eval_bleu_precisions": [ + 0.3875236377452757, + 0.1501827350766354, + 0.06474602049100307, + 0.028049171927176896 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228977, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.56896317330953, + "eval_chrf_word_order": 2, + "eval_loss": 2.092973232269287, + "eval_meteor": 0.30272942865066477, + "eval_runtime": 886.4858, + "eval_samples_per_second": 19.4, + "eval_scarebleu_bp": 0.9858838178101275, + "eval_scarebleu_counts": [ + 102325, + 38388, + 15930, + 6711 + ], + "eval_scarebleu_precisions": [ + 41.398130054658075, + 16.69203141170025, + 7.485656016954329, + 3.428702804884279 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.377272103133022, + "eval_scarebleu_sys_len": 247173, + "eval_scarebleu_totals": [ + 247173, + 229978, + 212807, + 195730 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 157196, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.9864083271893, + "step": 167000 + }, + { + "epoch": 65.61, + "learning_rate": 3.3870015791551524e-05, + "loss": 1.886, + "step": 167500 + }, + { + "epoch": 65.61, + "eval_bleu_bleu": 0.09651998384407016, + "eval_bleu_brevity_penalty": 0.9569294879141641, + "eval_bleu_length_ratio": 0.9578309460758186, + "eval_bleu_precisions": [ + 0.3880673528135968, + 0.14998862753274322, + 0.06437203736466655, + 0.027623996968994396 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228231, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.509324802818995, + "eval_chrf_word_order": 2, + "eval_loss": 2.0901103019714355, + "eval_meteor": 0.30218263603348416, + "eval_runtime": 876.7129, + "eval_samples_per_second": 19.616, + "eval_scarebleu_bp": 0.9841144609437208, + "eval_scarebleu_counts": [ + 102232, + 38237, + 15795, + 6620 + ], + "eval_scarebleu_precisions": [ + 41.433759159587574, + 16.65802623496456, + 7.437596236703443, + 3.389743721037405 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.302901660317794, + "eval_scarebleu_sys_len": 246736, + "eval_scarebleu_totals": [ + 246736, + 229541, + 212367, + 195295 + ], + "eval_steps_per_second": 0.614, + "eval_ter_num_edits": 157165, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.97221217297327, + "step": 167500 + }, + { + "epoch": 65.8, + "learning_rate": 3.382066719305172e-05, + "loss": 1.8875, + "step": 168000 + }, + { + "epoch": 65.8, + "eval_bleu_bleu": 0.09765092574972643, + "eval_bleu_brevity_penalty": 0.9621909660549092, + "eval_bleu_length_ratio": 0.9628880430084061, + "eval_bleu_precisions": [ + 0.3876331526002894, + 0.15018304663095255, + 0.06487528321423812, + 0.028089193439676478 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229436, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.679754727014135, + "eval_chrf_word_order": 2, + "eval_loss": 2.0891895294189453, + "eval_meteor": 0.3035694078003616, + "eval_runtime": 871.7243, + "eval_samples_per_second": 19.729, + "eval_scarebleu_bp": 0.9856815304250173, + "eval_scarebleu_counts": [ + 102368, + 38449, + 15968, + 6752 + ], + "eval_scarebleu_precisions": [ + 41.4239063138599, + 16.722191294666157, + 7.505311248566433, + 3.450549113599313 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.407406257963533, + "eval_scarebleu_sys_len": 247123, + "eval_scarebleu_totals": [ + 247123, + 229928, + 212756, + 195679 + ], + "eval_steps_per_second": 0.617, + "eval_ter_num_edits": 157118, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.95068897141994, + "step": 168000 + }, + { + "epoch": 66.0, + "learning_rate": 3.3771318594551917e-05, + "loss": 1.8917, + "step": 168500 + }, + { + "epoch": 66.0, + "eval_bleu_bleu": 0.09718393644196359, + "eval_bleu_brevity_penalty": 0.9603251999901073, + "eval_bleu_length_ratio": 0.9610918293261261, + "eval_bleu_precisions": [ + 0.38811307901907355, + 0.14971696732495174, + 0.06438736193167223, + 0.02803333145656213 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229008, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.59055813228703, + "eval_chrf_word_order": 2, + "eval_loss": 2.0851340293884277, + "eval_meteor": 0.30309670810388084, + "eval_runtime": 883.1641, + "eval_samples_per_second": 19.473, + "eval_scarebleu_bp": 0.9824110264564475, + "eval_scarebleu_counts": [ + 102146, + 38142, + 15765, + 6651 + ], + "eval_scarebleu_precisions": [ + 41.469494470517546, + 16.647099131026838, + 7.438145205427746, + 3.4130621083907653 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.303482490566582, + "eval_scarebleu_sys_len": 246316, + "eval_scarebleu_totals": [ + 246316, + 229121, + 211948, + 194869 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 157182, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.97999716076916, + "step": 168500 + }, + { + "epoch": 66.2, + "learning_rate": 3.372196999605211e-05, + "loss": 1.8712, + "step": 169000 + }, + { + "epoch": 66.2, + "eval_bleu_bleu": 0.09693619971322982, + "eval_bleu_brevity_penalty": 0.9564215858946599, + "eval_bleu_length_ratio": 0.9573441218067895, + "eval_bleu_precisions": [ + 0.3875808254608421, + 0.15014223402237814, + 0.06460603120371183, + 0.028067792773675125 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228115, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.65792507778803, + "eval_chrf_word_order": 2, + "eval_loss": 2.0938174724578857, + "eval_meteor": 0.3019079006062239, + "eval_runtime": 883.445, + "eval_samples_per_second": 19.467, + "eval_scarebleu_bp": 0.9818791331411618, + "eval_scarebleu_counts": [ + 101972, + 38248, + 15816, + 6677 + ], + "eval_scarebleu_precisions": [ + 41.420882669537136, + 16.70291279095157, + 7.466822776264417, + 3.428762163966416 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.327373542758174, + "eval_scarebleu_sys_len": 246185, + "eval_scarebleu_totals": [ + 246185, + 228990, + 211817, + 194735 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 157359, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.06105262193809, + "step": 169000 + }, + { + "epoch": 66.39, + "learning_rate": 3.367272009474931e-05, + "loss": 1.8692, + "step": 169500 + }, + { + "epoch": 66.39, + "eval_bleu_bleu": 0.09709517714487899, + "eval_bleu_brevity_penalty": 0.9609489473544581, + "eval_bleu_length_ratio": 0.9616919661405328, + "eval_bleu_precisions": [ + 0.38792761105122825, + 0.14998395893487326, + 0.06449857542544726, + 0.02777433981795065 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229151, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.63458755616925, + "eval_chrf_word_order": 2, + "eval_loss": 2.0880398750305176, + "eval_meteor": 0.3030631986023125, + "eval_runtime": 884.0341, + "eval_samples_per_second": 19.454, + "eval_scarebleu_bp": 0.9865995910871563, + "eval_scarebleu_counts": [ + 102474, + 38387, + 15905, + 6678 + ], + "eval_scarebleu_precisions": [ + 41.42874469375379, + 16.678759966109794, + 7.467732166417038, + 3.408742879310697 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.361954835437794, + "eval_scarebleu_sys_len": 247350, + "eval_scarebleu_totals": [ + 247350, + 230155, + 212983, + 195908 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 157127, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.95481043554717, + "step": 169500 + }, + { + "epoch": 66.59, + "learning_rate": 3.362337149624951e-05, + "loss": 1.8823, + "step": 170000 + }, + { + "epoch": 66.59, + "eval_bleu_bleu": 0.09723773390220972, + "eval_bleu_brevity_penalty": 0.961489516726064, + "eval_bleu_length_ratio": 0.9622123644970811, + "eval_bleu_precisions": [ + 0.38784865336386437, + 0.14988211995473405, + 0.06441617073671249, + 0.0279353478566409 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229275, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.606704898018556, + "eval_chrf_word_order": 2, + "eval_loss": 2.0876386165618896, + "eval_meteor": 0.30320266446097, + "eval_runtime": 877.5064, + "eval_samples_per_second": 19.599, + "eval_scarebleu_bp": 0.9856774842658502, + "eval_scarebleu_counts": [ + 102330, + 38334, + 15877, + 6694 + ], + "eval_scarebleu_precisions": [ + 41.40869691893073, + 16.672248148325338, + 7.462609398648204, + 3.4209786636003576 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.357076145844157, + "eval_scarebleu_sys_len": 247122, + "eval_scarebleu_totals": [ + 247122, + 229927, + 212754, + 195675 + ], + "eval_steps_per_second": 0.613, + "eval_ter_num_edits": 157156, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.96809070884603, + "step": 170000 + }, + { + "epoch": 66.78, + "learning_rate": 3.357402289774971e-05, + "loss": 1.8762, + "step": 170500 + }, + { + "epoch": 66.78, + "eval_bleu_bleu": 0.09723910669134933, + "eval_bleu_brevity_penalty": 0.9593997956358763, + "eval_bleu_length_ratio": 0.9602021160068659, + "eval_bleu_precisions": [ + 0.3889403660903163, + 0.15051913743318793, + 0.06460024068874008, + 0.0279033585497018 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228796, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.69500147202816, + "eval_chrf_word_order": 2, + "eval_loss": 2.085594415664673, + "eval_meteor": 0.30343697354064614, + "eval_runtime": 887.2719, + "eval_samples_per_second": 19.383, + "eval_scarebleu_bp": 0.9858474090577152, + "eval_scarebleu_counts": [ + 102596, + 38523, + 15921, + 6683 + ], + "eval_scarebleu_precisions": [ + 41.50928128691881, + 16.7513882305876, + 7.481778408530196, + 3.414589283615796 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.381369744787106, + "eval_scarebleu_sys_len": 247164, + "eval_scarebleu_totals": [ + 247164, + 229969, + 212797, + 195719 + ], + "eval_steps_per_second": 0.606, + "eval_ter_num_edits": 156934, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.86642792704092, + "step": 170500 + }, + { + "epoch": 66.98, + "learning_rate": 3.3524674299249906e-05, + "loss": 1.8844, + "step": 171000 + }, + { + "epoch": 66.98, + "eval_bleu_bleu": 0.09734116074583911, + "eval_bleu_brevity_penalty": 0.9585041650762318, + "eval_bleu_length_ratio": 0.959341780014185, + "eval_bleu_precisions": [ + 0.38911418209815785, + 0.15059414558459006, + 0.06486372388513062, + 0.027984853529567782 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228591, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.68559952545107, + "eval_chrf_word_order": 2, + "eval_loss": 2.083364963531494, + "eval_meteor": 0.3033112203664354, + "eval_runtime": 902.9978, + "eval_samples_per_second": 19.045, + "eval_scarebleu_bp": 0.9827397680639525, + "eval_scarebleu_counts": [ + 102388, + 38399, + 15893, + 6693 + ], + "eval_scarebleu_precisions": [ + 41.55407736295491, + 16.753344211656092, + 7.4956374098005, + 3.433011899876898 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.369419456955162, + "eval_scarebleu_sys_len": 246397, + "eval_scarebleu_totals": [ + 246397, + 229202, + 212030, + 194960 + ], + "eval_steps_per_second": 0.596, + "eval_ter_num_edits": 157001, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.89710993776589, + "step": 171000 + }, + { + "epoch": 67.18, + "learning_rate": 3.34754243979471e-05, + "loss": 1.8511, + "step": 171500 + }, + { + "epoch": 67.18, + "eval_bleu_bleu": 0.09683889766686163, + "eval_bleu_brevity_penalty": 0.9606654721549959, + "eval_bleu_length_ratio": 0.9614191766794388, + "eval_bleu_precisions": [ + 0.3878194215272867, + 0.14977983963452907, + 0.06421165607941211, + 0.027683043502729474 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229086, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.6799614346122, + "eval_chrf_word_order": 2, + "eval_loss": 2.0879604816436768, + "eval_meteor": 0.3025752239158362, + "eval_runtime": 888.9848, + "eval_samples_per_second": 19.346, + "eval_scarebleu_bp": 0.9872138632984448, + "eval_scarebleu_counts": [ + 102518, + 38434, + 15853, + 6650 + ], + "eval_scarebleu_precisions": [ + 41.4210794256208, + 16.68815971724698, + 7.438008773781875, + 3.391836130960578 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.344662950944025, + "eval_scarebleu_sys_len": 247502, + "eval_scarebleu_totals": [ + 247502, + 230307, + 213135, + 196059 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 157217, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.99602507681952, + "step": 171500 + }, + { + "epoch": 67.37, + "learning_rate": 3.34260757994473e-05, + "loss": 1.8606, + "step": 172000 + }, + { + "epoch": 67.37, + "eval_bleu_bleu": 0.09678096668757652, + "eval_bleu_brevity_penalty": 0.960735257828986, + "eval_bleu_length_ratio": 0.9614863248544773, + "eval_bleu_precisions": [ + 0.3883684996202565, + 0.15017436894486733, + 0.06429433361575393, + 0.027462014631401237 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229102, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.69318244695336, + "eval_chrf_word_order": 2, + "eval_loss": 2.0868899822235107, + "eval_meteor": 0.3029921447955039, + "eval_runtime": 882.0089, + "eval_samples_per_second": 19.499, + "eval_scarebleu_bp": 0.9848274332301573, + "eval_scarebleu_counts": [ + 102470, + 38377, + 15809, + 6578 + ], + "eval_scarebleu_precisions": [ + 41.50061560393986, + 16.706208073412068, + 7.43798931044866, + 3.365342801450914 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.303539564114054, + "eval_scarebleu_sys_len": 246912, + "eval_scarebleu_totals": [ + 246912, + 229717, + 212544, + 195463 + ], + "eval_steps_per_second": 0.61, + "eval_ter_num_edits": 157103, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.94381986454121, + "step": 172000 + }, + { + "epoch": 67.57, + "learning_rate": 3.33767272009475e-05, + "loss": 1.8682, + "step": 172500 + }, + { + "epoch": 67.57, + "eval_bleu_bleu": 0.09737555778263836, + "eval_bleu_brevity_penalty": 0.9667453726375592, + "eval_bleu_length_ratio": 0.9672862484734283, + "eval_bleu_precisions": [ + 0.3869205671543361, + 0.14983895090698535, + 0.06424787514467371, + 0.02763415042715953 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230484, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.803940236975386, + "eval_chrf_word_order": 2, + "eval_loss": 2.0870554447174072, + "eval_meteor": 0.30406442661846866, + "eval_runtime": 904.8102, + "eval_samples_per_second": 19.007, + "eval_scarebleu_bp": 0.9902756167422008, + "eval_scarebleu_counts": [ + 102661, + 38573, + 15958, + 6712 + ], + "eval_scarebleu_precisions": [ + 41.352044823794316, + 16.69349882717492, + 7.460635074989715, + 3.410274518969398 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.40009473476636, + "eval_scarebleu_sys_len": 248261, + "eval_scarebleu_totals": [ + 248261, + 231066, + 213896, + 196817 + ], + "eval_steps_per_second": 0.595, + "eval_ter_num_edits": 157175, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.97679157755908, + "step": 172500 + }, + { + "epoch": 67.76, + "learning_rate": 3.332737860244769e-05, + "loss": 1.876, + "step": 173000 + }, + { + "epoch": 67.76, + "eval_bleu_bleu": 0.09695993820893188, + "eval_bleu_brevity_penalty": 0.9594041626804595, + "eval_bleu_length_ratio": 0.9602063127678058, + "eval_bleu_precisions": [ + 0.38802082195133675, + 0.1503199402652149, + 0.0645285716489835, + 0.027716554962430175 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228797, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.72180504938234, + "eval_chrf_word_order": 2, + "eval_loss": 2.0837759971618652, + "eval_meteor": 0.30288350371142614, + "eval_runtime": 906.0936, + "eval_samples_per_second": 18.98, + "eval_scarebleu_bp": 0.9831292502660812, + "eval_scarebleu_counts": [ + 102189, + 38376, + 15851, + 6619 + ], + "eval_scarebleu_precisions": [ + 41.457161055283514, + 16.736299488002512, + 7.472445621941676, + 3.3934714510563904 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.322754933611867, + "eval_scarebleu_sys_len": 246493, + "eval_scarebleu_totals": [ + 246493, + 229298, + 212126, + 195051 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 157082, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.934203114911, + "step": 173000 + }, + { + "epoch": 67.96, + "learning_rate": 3.327812870114489e-05, + "loss": 1.8835, + "step": 173500 + }, + { + "epoch": 67.96, + "eval_bleu_bleu": 0.09708879202468527, + "eval_bleu_brevity_penalty": 0.9578833260045182, + "eval_bleu_length_ratio": 0.9587458399607183, + "eval_bleu_precisions": [ + 0.3888482768582922, + 0.15090365152849178, + 0.06475313126317037, + 0.027776993329680942 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228449, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.84847513673323, + "eval_chrf_word_order": 2, + "eval_loss": 2.0840365886688232, + "eval_meteor": 0.30315872839942376, + "eval_runtime": 882.9958, + "eval_samples_per_second": 19.477, + "eval_scarebleu_bp": 0.9844061919121617, + "eval_scarebleu_counts": [ + 102562, + 38532, + 15948, + 6682 + ], + "eval_scarebleu_precisions": [ + 41.555379080094646, + 16.78127980558592, + 7.507060817171907, + 3.420317154820282 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.38731925642511, + "eval_scarebleu_sys_len": 246808, + "eval_scarebleu_totals": [ + 246808, + 229613, + 212440, + 195362 + ], + "eval_steps_per_second": 0.609, + "eval_ter_num_edits": 157055, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.9218387225293, + "step": 173500 + }, + { + "epoch": 68.16, + "learning_rate": 3.322878010264509e-05, + "loss": 1.8577, + "step": 174000 + }, + { + "epoch": 68.16, + "eval_bleu_bleu": 0.09697224231895986, + "eval_bleu_brevity_penalty": 0.9601462943854764, + "eval_bleu_length_ratio": 0.9609197621275899, + "eval_bleu_precisions": [ + 0.3878026091096097, + 0.1501331620799728, + 0.06444651124551028, + 0.027730221661560642 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228967, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.78213145552192, + "eval_chrf_word_order": 2, + "eval_loss": 2.086319923400879, + "eval_meteor": 0.3028799512410185, + "eval_runtime": 900.4775, + "eval_samples_per_second": 19.099, + "eval_scarebleu_bp": 0.9848071852414166, + "eval_scarebleu_counts": [ + 102349, + 38408, + 15880, + 6650 + ], + "eval_scarebleu_precisions": [ + 41.452449707784716, + 16.72006686633698, + 7.471569923637544, + 3.4021958232290674 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.345954938797002, + "eval_scarebleu_sys_len": 246907, + "eval_scarebleu_totals": [ + 246907, + 229712, + 212539, + 195462 + ], + "eval_steps_per_second": 0.597, + "eval_ter_num_edits": 157269, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 72.01983798066576, + "step": 174000 + }, + { + "epoch": 68.35, + "learning_rate": 3.317943150414528e-05, + "loss": 1.8581, + "step": 174500 + }, + { + "epoch": 68.35, + "eval_bleu_bleu": 0.097758624873431, + "eval_bleu_brevity_penalty": 0.9584167452965814, + "eval_bleu_length_ratio": 0.9592578447953869, + "eval_bleu_precisions": [ + 0.38850510344706896, + 0.1509774051926425, + 0.06521190651501187, + 0.028298745350799466 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228571, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.79508014762538, + "eval_chrf_word_order": 2, + "eval_loss": 2.085430145263672, + "eval_meteor": 0.30336689016943735, + "eval_runtime": 874.8303, + "eval_samples_per_second": 19.659, + "eval_scarebleu_bp": 0.9844629076512799, + "eval_scarebleu_counts": [ + 102458, + 38593, + 16045, + 6753 + ], + "eval_scarebleu_precisions": [ + 41.51088638776122, + 16.806821497471987, + 7.55225861720004, + 3.456359178826793 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.436290704088359, + "eval_scarebleu_sys_len": 246822, + "eval_scarebleu_totals": [ + 246822, + 229627, + 212453, + 195379 + ], + "eval_steps_per_second": 0.615, + "eval_ter_num_edits": 157028, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.90947433014759, + "step": 174500 + }, + { + "epoch": 68.55, + "learning_rate": 3.313008290564548e-05, + "loss": 1.856, + "step": 175000 + }, + { + "epoch": 68.55, + "eval_bleu_bleu": 0.09794436987386987, + "eval_bleu_brevity_penalty": 0.9613413240392183, + "eval_bleu_length_ratio": 0.9620696746251244, + "eval_bleu_precisions": [ + 0.3891145126744343, + 0.15100025466172434, + 0.06500656787488199, + 0.02820948225450947 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229241, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.84579487081182, + "eval_chrf_word_order": 2, + "eval_loss": 2.083065986633301, + "eval_meteor": 0.30363894343261494, + "eval_runtime": 906.3417, + "eval_samples_per_second": 18.975, + "eval_scarebleu_bp": 0.985726037110833, + "eval_scarebleu_counts": [ + 102742, + 38613, + 15995, + 6753 + ], + "eval_scarebleu_precisions": [ + 41.57339742811592, + 16.79271458952157, + 7.517613163695498, + 3.450813263632322 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.435119103576596, + "eval_scarebleu_sys_len": 247134, + "eval_scarebleu_totals": [ + 247134, + 229939, + 212767, + 195693 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 156715, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.76613896661156, + "step": 175000 + }, + { + "epoch": 68.74, + "learning_rate": 3.308083300434268e-05, + "loss": 1.8621, + "step": 175500 + }, + { + "epoch": 68.74, + "eval_bleu_bleu": 0.09774147631345603, + "eval_bleu_brevity_penalty": 0.9611887506890342, + "eval_bleu_length_ratio": 0.9619227879922276, + "eval_bleu_precisions": [ + 0.38908667312374023, + 0.15093084792770187, + 0.06494672879929382, + 0.028034912886499376 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229206, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.81260217458775, + "eval_chrf_word_order": 2, + "eval_loss": 2.077259063720703, + "eval_meteor": 0.304581519085826, + "eval_runtime": 886.5686, + "eval_samples_per_second": 19.398, + "eval_scarebleu_bp": 0.9869269798624279, + "eval_scarebleu_counts": [ + 102827, + 38652, + 15994, + 6743 + ], + "eval_scarebleu_precisions": [ + 41.55784845067918, + 16.787991452248995, + 7.506629432332856, + 3.440534321153954 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.43446075098597, + "eval_scarebleu_sys_len": 247431, + "eval_scarebleu_totals": [ + 247431, + 230236, + 213065, + 195987 + ], + "eval_steps_per_second": 0.607, + "eval_ter_num_edits": 156812, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.81055919109397, + "step": 175500 + }, + { + "epoch": 68.94, + "learning_rate": 3.303148440584288e-05, + "loss": 1.8655, + "step": 176000 + }, + { + "epoch": 68.94, + "eval_bleu_bleu": 0.09858561668293718, + "eval_bleu_brevity_penalty": 0.9631182435295741, + "eval_bleu_length_ratio": 0.9637819530886063, + "eval_bleu_precisions": [ + 0.3891503990873028, + 0.1514021858849445, + 0.06534284382952794, + 0.028515969054872064 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229649, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.84898836609154, + "eval_chrf_word_order": 2, + "eval_loss": 2.0748279094696045, + "eval_meteor": 0.30531634171286975, + "eval_runtime": 905.8181, + "eval_samples_per_second": 18.986, + "eval_scarebleu_bp": 0.9889616908129232, + "eval_scarebleu_counts": [ + 103021, + 38783, + 16084, + 6812 + ], + "eval_scarebleu_precisions": [ + 41.55161635105976, + 16.808095692121, + 7.53112606348359, + 3.4668783844306015 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.492267028234114, + "eval_scarebleu_sys_len": 247935, + "eval_scarebleu_totals": [ + 247935, + 230740, + 213567, + 196488 + ], + "eval_steps_per_second": 0.594, + "eval_ter_num_edits": 156685, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.75240075285411, + "step": 176000 + }, + { + "epoch": 69.13, + "learning_rate": 3.298213580734307e-05, + "loss": 1.8546, + "step": 176500 + }, + { + "epoch": 69.13, + "eval_bleu_bleu": 0.09821461739230929, + "eval_bleu_brevity_penalty": 0.9623651657987161, + "eval_bleu_length_ratio": 0.9630559134460024, + "eval_bleu_precisions": [ + 0.38896006554062296, + 0.15120524210833752, + 0.06518552685526856, + 0.028295794657547325 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229476, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.83761293894894, + "eval_chrf_word_order": 2, + "eval_loss": 2.0792179107666016, + "eval_meteor": 0.30452710740492167, + "eval_runtime": 877.524, + "eval_samples_per_second": 19.598, + "eval_scarebleu_bp": 0.9886954732497283, + "eval_scarebleu_counts": [ + 102931, + 38803, + 16082, + 6789 + ], + "eval_scarebleu_precisions": [ + 41.52637078456765, + 16.821575036631785, + 7.53251741209643, + 3.4562810232913326 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.481470179521395, + "eval_scarebleu_sys_len": 247869, + "eval_scarebleu_totals": [ + 247869, + 230674, + 213501, + 196425 + ], + "eval_steps_per_second": 0.613, + "eval_ter_num_edits": 156833, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.82017594072418, + "step": 176500 + }, + { + "epoch": 69.33, + "learning_rate": 3.2932787208843266e-05, + "loss": 1.8431, + "step": 177000 + }, + { + "epoch": 69.33, + "eval_bleu_bleu": 0.09821680208045891, + "eval_bleu_brevity_penalty": 0.9599848166024076, + "eval_bleu_length_ratio": 0.9607644819728134, + "eval_bleu_precisions": [ + 0.3892849342593806, + 0.1516376602829008, + 0.0653948152868861, + 0.028383615348218913 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228930, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.82055381781796, + "eval_chrf_word_order": 2, + "eval_loss": 2.080317258834839, + "eval_meteor": 0.3045732764072218, + "eval_runtime": 913.5153, + "eval_samples_per_second": 18.826, + "eval_scarebleu_bp": 0.9859849463767841, + "eval_scarebleu_counts": [ + 102742, + 38764, + 16094, + 6790 + ], + "eval_scarebleu_precisions": [ + 41.56263400189322, + 16.853693212697227, + 7.561903866936052, + 3.4686923693876404 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.47939646326486, + "eval_scarebleu_sys_len": 247198, + "eval_scarebleu_totals": [ + 247198, + 230003, + 212830, + 195751 + ], + "eval_steps_per_second": 0.589, + "eval_ter_num_edits": 156783, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.7972789177951, + "step": 177000 + }, + { + "epoch": 69.53, + "learning_rate": 3.288353730754047e-05, + "loss": 1.8557, + "step": 177500 + }, + { + "epoch": 69.53, + "eval_bleu_bleu": 0.09827911543072787, + "eval_bleu_brevity_penalty": 0.9639012132516708, + "eval_bleu_length_ratio": 0.9645373700577894, + "eval_bleu_precisions": [ + 0.3883191416226847, + 0.1510200626428511, + 0.06516501000138127, + 0.028279839265598468 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229829, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.88992257276902, + "eval_chrf_word_order": 2, + "eval_loss": 2.0765602588653564, + "eval_meteor": 0.30449828769430376, + "eval_runtime": 899.3826, + "eval_samples_per_second": 19.122, + "eval_scarebleu_bp": 0.9883404074683583, + "eval_scarebleu_counts": [ + 102796, + 38715, + 16073, + 6761 + ], + "eval_scarebleu_precisions": [ + 41.48663537559377, + 16.789831125913977, + 7.5313709503593955, + 3.4436040441082842 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.458215846229574, + "eval_scarebleu_sys_len": 247781, + "eval_scarebleu_totals": [ + 247781, + 230586, + 213414, + 196335 + ], + "eval_steps_per_second": 0.598, + "eval_ter_num_edits": 156905, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.85314765374206, + "step": 177500 + }, + { + "epoch": 69.72, + "learning_rate": 3.283418870904067e-05, + "loss": 1.8463, + "step": 178000 + }, + { + "epoch": 69.72, + "eval_bleu_bleu": 0.09824996627200164, + "eval_bleu_brevity_penalty": 0.9613587595688059, + "eval_bleu_length_ratio": 0.962086461668884, + "eval_bleu_precisions": [ + 0.38852755785295207, + 0.1514265503419005, + 0.0654167243918333, + 0.028344907082009613 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229245, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.86696588984965, + "eval_chrf_word_order": 2, + "eval_loss": 2.080667495727539, + "eval_meteor": 0.30417263063359695, + "eval_runtime": 891.9536, + "eval_samples_per_second": 19.281, + "eval_scarebleu_bp": 0.9857058070411465, + "eval_scarebleu_counts": [ + 102550, + 38649, + 16082, + 6770 + ], + "eval_scarebleu_precisions": [ + 41.49654633814728, + 16.808736420016178, + 7.558751645046061, + 3.4596771308698253 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.455274005846205, + "eval_scarebleu_sys_len": 247129, + "eval_scarebleu_totals": [ + 247129, + 229934, + 212760, + 195683 + ], + "eval_steps_per_second": 0.603, + "eval_ter_num_edits": 156834, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.82063388118277, + "step": 178000 + }, + { + "epoch": 69.92, + "learning_rate": 3.278484011054086e-05, + "loss": 1.8534, + "step": 178500 + }, + { + "epoch": 69.92, + "eval_bleu_bleu": 0.09823195280402376, + "eval_bleu_brevity_penalty": 0.9578920727811508, + "eval_bleu_length_ratio": 0.9587542334825981, + "eval_bleu_precisions": [ + 0.38881860880451385, + 0.15148918847275344, + 0.06564826502485896, + 0.028601766712604206 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228451, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.80241071488176, + "eval_chrf_word_order": 2, + "eval_loss": 2.076969861984253, + "eval_meteor": 0.30344758377068387, + "eval_runtime": 889.7756, + "eval_samples_per_second": 19.328, + "eval_scarebleu_bp": 0.9828371525937057, + "eval_scarebleu_counts": [ + 102383, + 38604, + 16060, + 6813 + ], + "eval_scarebleu_precisions": [ + 41.548001184963944, + 16.8410215246089, + 7.573578303537324, + 3.4943299841516517 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.46508992222991, + "eval_scarebleu_sys_len": 246421, + "eval_scarebleu_totals": [ + 246421, + 229226, + 212053, + 194973 + ], + "eval_steps_per_second": 0.605, + "eval_ter_num_edits": 156897, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.8494841300734, + "step": 178500 + }, + { + "epoch": 70.11, + "learning_rate": 3.273549151204106e-05, + "loss": 1.848, + "step": 179000 + }, + { + "epoch": 70.11, + "eval_bleu_bleu": 0.09825816710872362, + "eval_bleu_brevity_penalty": 0.9600721049990573, + "eval_bleu_length_ratio": 0.9608484171916115, + "eval_bleu_precisions": [ + 0.3899322996287399, + 0.1519066846119336, + 0.06554091553783223, + 0.028260551244072493 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228950, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.89270157946843, + "eval_chrf_word_order": 2, + "eval_loss": 2.0775656700134277, + "eval_meteor": 0.30507217778519075, + "eval_runtime": 863.5068, + "eval_samples_per_second": 19.916, + "eval_scarebleu_bp": 0.9854589677058144, + "eval_scarebleu_counts": [ + 102856, + 38824, + 16120, + 6791 + ], + "eval_scarebleu_precisions": [ + 41.630644195120375, + 16.88932584514058, + 7.578749412317818, + 3.4713489751060678 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.492615132430236, + "eval_scarebleu_sys_len": 247068, + "eval_scarebleu_totals": [ + 247068, + 229873, + 212700, + 195630 + ], + "eval_steps_per_second": 0.623, + "eval_ter_num_edits": 156588, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.7079805283717, + "step": 179000 + }, + { + "epoch": 70.31, + "learning_rate": 3.268624161073826e-05, + "loss": 1.837, + "step": 179500 + }, + { + "epoch": 70.31, + "eval_bleu_bleu": 0.09815658434781456, + "eval_bleu_brevity_penalty": 0.9576471353335374, + "eval_bleu_length_ratio": 0.9585192148699634, + "eval_bleu_precisions": [ + 0.38968015937301603, + 0.1516998106060606, + 0.06558373960276641, + 0.028468604874521193 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228395, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.827860696327214, + "eval_chrf_word_order": 2, + "eval_loss": 2.0745432376861572, + "eval_meteor": 0.3041129718759617, + "eval_runtime": 872.0653, + "eval_samples_per_second": 19.721, + "eval_scarebleu_bp": 0.9817897802933008, + "eval_scarebleu_counts": [ + 102581, + 38629, + 16071, + 6789 + ], + "eval_scarebleu_precisions": [ + 41.67198157318525, + 16.870916459942002, + 7.587926174591708, + 3.486455257414302 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.465447556375679, + "eval_scarebleu_sys_len": 246163, + "eval_scarebleu_totals": [ + 246163, + 228968, + 211797, + 194725 + ], + "eval_steps_per_second": 0.617, + "eval_ter_num_edits": 156723, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.76980249028021, + "step": 179500 + }, + { + "epoch": 70.51, + "learning_rate": 3.2636893012238454e-05, + "loss": 1.8387, + "step": 180000 + }, + { + "epoch": 70.51, + "eval_bleu_bleu": 0.09825394775736747, + "eval_bleu_brevity_penalty": 0.9605695092139387, + "eval_bleu_length_ratio": 0.9613268479387609, + "eval_bleu_precisions": [ + 0.3898211853455803, + 0.15146623621199892, + 0.0655234221325157, + 0.028294824529310782 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229064, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.89533146772041, + "eval_chrf_word_order": 2, + "eval_loss": 2.073199987411499, + "eval_meteor": 0.30527948342107253, + "eval_runtime": 876.3061, + "eval_samples_per_second": 19.626, + "eval_scarebleu_bp": 0.9875168209622288, + "eval_scarebleu_counts": [ + 102993, + 38793, + 16123, + 6787 + ], + "eval_scarebleu_precisions": [ + 41.60039098946994, + 16.838555095450165, + 7.562028047464941, + 3.4604951868167726 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.490507061356299, + "eval_scarebleu_sys_len": 247577, + "eval_scarebleu_totals": [ + 247577, + 230382, + 213210, + 196128 + ], + "eval_steps_per_second": 0.614, + "eval_ter_num_edits": 156629, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.72675608717356, + "step": 180000 + }, + { + "epoch": 70.7, + "learning_rate": 3.258754441373865e-05, + "loss": 1.8446, + "step": 180500 + }, + { + "epoch": 70.7, + "eval_bleu_bleu": 0.09784257416540261, + "eval_bleu_brevity_penalty": 0.9617553389268572, + "eval_bleu_length_ratio": 0.9624683669144155, + "eval_bleu_precisions": [ + 0.3888399553493564, + 0.15090906519720373, + 0.06515986091023787, + 0.028014746378033292 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229336, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.872657991802704, + "eval_chrf_word_order": 2, + "eval_loss": 2.0737552642822266, + "eval_meteor": 0.3039754066348473, + "eval_runtime": 876.4342, + "eval_samples_per_second": 19.623, + "eval_scarebleu_bp": 0.986987595807709, + "eval_scarebleu_counts": [ + 102804, + 38651, + 16060, + 6737 + ], + "eval_scarebleu_precisions": [ + 41.54603428626852, + 16.78646346812826, + 7.537075276891309, + 3.437157215377159 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.442856543523865, + "eval_scarebleu_sys_len": 247446, + "eval_scarebleu_totals": [ + 247446, + 230251, + 213080, + 196005 + ], + "eval_steps_per_second": 0.614, + "eval_ter_num_edits": 156892, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.84719442778051, + "step": 180500 + }, + { + "epoch": 70.9, + "learning_rate": 3.2538195815238847e-05, + "loss": 1.8517, + "step": 181000 + }, + { + "epoch": 70.9, + "eval_bleu_bleu": 0.09881390081968812, + "eval_bleu_brevity_penalty": 0.9608748151423372, + "eval_bleu_length_ratio": 0.9616206212045543, + "eval_bleu_precisions": [ + 0.390614225736905, + 0.15218529860006888, + 0.06580244378272923, + 0.02859184327934152 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229134, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.95597209748126, + "eval_chrf_word_order": 2, + "eval_loss": 2.07063364982605, + "eval_meteor": 0.305914367516995, + "eval_runtime": 903.0443, + "eval_samples_per_second": 19.044, + "eval_scarebleu_bp": 0.9852687390578014, + "eval_scarebleu_counts": [ + 103062, + 38913, + 16157, + 6835 + ], + "eval_scarebleu_precisions": [ + 41.72195886179718, + 16.931504703558343, + 7.597787956022459, + 3.494769350335927 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.530448140891847, + "eval_scarebleu_sys_len": 247021, + "eval_scarebleu_totals": [ + 247021, + 229826, + 212654, + 195578 + ], + "eval_steps_per_second": 0.596, + "eval_ter_num_edits": 156433, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.63699975729155, + "step": 181000 + }, + { + "epoch": 71.09, + "learning_rate": 3.2488945913936044e-05, + "loss": 1.8311, + "step": 181500 + }, + { + "epoch": 71.09, + "eval_bleu_bleu": 0.09864519963705456, + "eval_bleu_brevity_penalty": 0.9635706980792524, + "eval_bleu_length_ratio": 0.9642184162263565, + "eval_bleu_precisions": [ + 0.3889263687525299, + 0.15153981501519584, + 0.06548274009058573, + 0.028460891505466778 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229753, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.93124004353895, + "eval_chrf_word_order": 2, + "eval_loss": 2.0752763748168945, + "eval_meteor": 0.3054138054198664, + "eval_runtime": 878.3784, + "eval_samples_per_second": 19.579, + "eval_scarebleu_bp": 0.9894294185545867, + "eval_scarebleu_counts": [ + 103045, + 38929, + 16220, + 6853 + ], + "eval_scarebleu_precisions": [ + 41.54186034323587, + 16.862892885608346, + 7.5907189187671396, + 3.4857224239834794 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.544715961157186, + "eval_scarebleu_sys_len": 248051, + "eval_scarebleu_totals": [ + 248051, + 230856, + 213682, + 196602 + ], + "eval_steps_per_second": 0.612, + "eval_ter_num_edits": 156804, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.80689566742532, + "step": 181500 + }, + { + "epoch": 71.29, + "learning_rate": 3.243959731543624e-05, + "loss": 1.8286, + "step": 182000 + }, + { + "epoch": 71.29, + "eval_bleu_bleu": 0.09854012053683839, + "eval_bleu_brevity_penalty": 0.9625654594089544, + "eval_bleu_length_ratio": 0.9632489644492381, + "eval_bleu_precisions": [ + 0.3899321197967951, + 0.1518506831443952, + 0.06557049455842266, + 0.0282889639917811 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229522, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.97112226309719, + "eval_chrf_word_order": 2, + "eval_loss": 2.0752124786376953, + "eval_meteor": 0.3057049351063431, + "eval_runtime": 930.3188, + "eval_samples_per_second": 18.486, + "eval_scarebleu_bp": 0.9882798724592111, + "eval_scarebleu_counts": [ + 103132, + 38944, + 16154, + 6782 + ], + "eval_scarebleu_precisions": [ + 41.624758845039274, + 16.890242051255363, + 7.569892876221895, + 3.4545287843440877 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.507910850299815, + "eval_scarebleu_sys_len": 247766, + "eval_scarebleu_totals": [ + 247766, + 230571, + 213398, + 196322 + ], + "eval_steps_per_second": 0.578, + "eval_ter_num_edits": 156578, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.70340112378588, + "step": 182000 + }, + { + "epoch": 71.48, + "learning_rate": 3.239024871693644e-05, + "loss": 1.83, + "step": 182500 + }, + { + "epoch": 71.48, + "eval_bleu_bleu": 0.09879059194668904, + "eval_bleu_brevity_penalty": 0.9625611056105782, + "eval_bleu_length_ratio": 0.9632447676882981, + "eval_bleu_precisions": [ + 0.38890994723794337, + 0.15187494701543852, + 0.06570917643200812, + 0.028588271622266515 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229521, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.00868924592813, + "eval_chrf_word_order": 2, + "eval_loss": 2.071213483810425, + "eval_meteor": 0.30506795755673566, + "eval_runtime": 941.0466, + "eval_samples_per_second": 18.275, + "eval_scarebleu_bp": 0.9873431363193412, + "eval_scarebleu_counts": [ + 102917, + 38930, + 16198, + 6846 + ], + "eval_scarebleu_precisions": [ + 41.57691468646731, + 16.901176092628692, + 7.598808434780569, + 3.4914142624731617 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.537112490236838, + "eval_scarebleu_sys_len": 247534, + "eval_scarebleu_totals": [ + 247534, + 230339, + 213165, + 196081 + ], + "eval_steps_per_second": 0.572, + "eval_ter_num_edits": 156749, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.78170894220334, + "step": 182500 + }, + { + "epoch": 71.68, + "learning_rate": 3.234090011843664e-05, + "loss": 1.8396, + "step": 183000 + }, + { + "epoch": 71.68, + "eval_bleu_bleu": 0.09891316236288969, + "eval_bleu_brevity_penalty": 0.9624870882465976, + "eval_bleu_length_ratio": 0.9631734227523198, + "eval_bleu_precisions": [ + 0.38965769659788063, + 0.1519106585213062, + 0.06566743530617473, + 0.02869558870591934 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229504, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.9939527176431, + "eval_chrf_word_order": 2, + "eval_loss": 2.069362163543701, + "eval_meteor": 0.3051308217791897, + "eval_runtime": 926.4233, + "eval_samples_per_second": 18.564, + "eval_scarebleu_bp": 0.9869471855804522, + "eval_scarebleu_counts": [ + 102981, + 38875, + 16172, + 6846 + ], + "eval_scarebleu_precisions": [ + 41.61924699720332, + 16.88448191243089, + 7.5900651435222555, + 3.4929106057745782 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.530486877714456, + "eval_scarebleu_sys_len": 247436, + "eval_scarebleu_totals": [ + 247436, + 230241, + 213068, + 195997 + ], + "eval_steps_per_second": 0.581, + "eval_ter_num_edits": 156604, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.715307575709, + "step": 183000 + }, + { + "epoch": 71.88, + "learning_rate": 3.229165021713383e-05, + "loss": 1.8378, + "step": 183500 + }, + { + "epoch": 71.88, + "eval_bleu_bleu": 0.09904054562932313, + "eval_bleu_brevity_penalty": 0.959338655090597, + "eval_bleu_length_ratio": 0.9601433613537073, + "eval_bleu_precisions": [ + 0.3909442176394996, + 0.15272204814095383, + 0.06607107037602802, + 0.028796283768547332 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228782, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.01235952578372, + "eval_chrf_word_order": 2, + "eval_loss": 2.068675994873047, + "eval_meteor": 0.30620907491810523, + "eval_runtime": 947.7539, + "eval_samples_per_second": 18.146, + "eval_scarebleu_bp": 0.9864904379901286, + "eval_scarebleu_counts": [ + 103187, + 39086, + 16274, + 6881 + ], + "eval_scarebleu_precisions": [ + 41.721554404564074, + 16.98446082180352, + 7.642025977441137, + 3.512972625259095 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.58555278015184, + "eval_scarebleu_sys_len": 247323, + "eval_scarebleu_totals": [ + 247323, + 230128, + 212954, + 195874 + ], + "eval_steps_per_second": 0.568, + "eval_ter_num_edits": 156427, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.63425211454006, + "step": 183500 + }, + { + "epoch": 72.07, + "learning_rate": 3.224230161863403e-05, + "loss": 1.8311, + "step": 184000 + }, + { + "epoch": 72.07, + "eval_bleu_bleu": 0.09899243212835698, + "eval_bleu_brevity_penalty": 0.9607178118490906, + "eval_bleu_length_ratio": 0.9614695378107176, + "eval_bleu_precisions": [ + 0.39030022086617955, + 0.1523338508657263, + 0.0661134532532954, + 0.0286773850456666 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229098, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.94659572174669, + "eval_chrf_word_order": 2, + "eval_loss": 2.0698018074035645, + "eval_meteor": 0.3057568499399812, + "eval_runtime": 954.684, + "eval_samples_per_second": 18.014, + "eval_scarebleu_bp": 0.98741988436949, + "eval_scarebleu_counts": [ + 103107, + 38963, + 16248, + 6861 + ], + "eval_scarebleu_precisions": [ + 41.650474847810365, + 16.91410760642131, + 7.621585109576704, + 3.498618094295942 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.559913666813245, + "eval_scarebleu_sys_len": 247553, + "eval_scarebleu_totals": [ + 247553, + 230358, + 213184, + 196106 + ], + "eval_steps_per_second": 0.564, + "eval_ter_num_edits": 156503, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.66905558939227, + "step": 184000 + }, + { + "epoch": 72.27, + "learning_rate": 3.219295302013423e-05, + "loss": 1.8167, + "step": 184500 + }, + { + "epoch": 72.27, + "eval_bleu_bleu": 0.09929113632351481, + "eval_bleu_brevity_penalty": 0.9612018292815547, + "eval_bleu_length_ratio": 0.9619353782750473, + "eval_bleu_precisions": [ + 0.39027263327356254, + 0.15248521324063505, + 0.06622428189455641, + 0.02889152601474666 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229209, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.057655866016425, + "eval_chrf_word_order": 2, + "eval_loss": 2.0716052055358887, + "eval_meteor": 0.30556375092439725, + "eval_runtime": 943.6593, + "eval_samples_per_second": 18.225, + "eval_scarebleu_bp": 0.9844507545451862, + "eval_scarebleu_counts": [ + 102887, + 38950, + 16248, + 6895 + ], + "eval_scarebleu_precisions": [ + 41.68520251682407, + 16.96251262934188, + 7.647917156978113, + 3.5292551966299324 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.57093837433288, + "eval_scarebleu_sys_len": 246819, + "eval_scarebleu_totals": [ + 246819, + 229624, + 212450, + 195367 + ], + "eval_steps_per_second": 0.57, + "eval_ter_num_edits": 156555, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.6928684932385, + "step": 184500 + }, + { + "epoch": 72.46, + "learning_rate": 3.214360442163443e-05, + "loss": 1.8223, + "step": 185000 + }, + { + "epoch": 72.46, + "eval_bleu_bleu": 0.09910733721606768, + "eval_bleu_brevity_penalty": 0.9591595800060209, + "eval_bleu_length_ratio": 0.959971294155171, + "eval_bleu_precisions": [ + 0.3902710926331528, + 0.1526901950403222, + 0.06625579397375285, + 0.02887076947367234 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228741, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.98247149733688, + "eval_chrf_word_order": 2, + "eval_loss": 2.07300066947937, + "eval_meteor": 0.30565768867428944, + "eval_runtime": 947.178, + "eval_samples_per_second": 18.157, + "eval_scarebleu_bp": 0.9863893598268638, + "eval_scarebleu_counts": [ + 103022, + 39079, + 16298, + 6889 + ], + "eval_scarebleu_precisions": [ + 41.65905102346157, + 16.98326401654911, + 7.654230538022242, + 3.517433993862744 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.588117391051442, + "eval_scarebleu_sys_len": 247298, + "eval_scarebleu_totals": [ + 247298, + 230103, + 212928, + 195853 + ], + "eval_steps_per_second": 0.568, + "eval_ter_num_edits": 156493, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.66447618480645, + "step": 185000 + }, + { + "epoch": 72.66, + "learning_rate": 3.209425582313462e-05, + "loss": 1.8316, + "step": 185500 + }, + { + "epoch": 72.66, + "eval_bleu_bleu": 0.09913073974939668, + "eval_bleu_brevity_penalty": 0.9579445519020838, + "eval_bleu_length_ratio": 0.958804594613877, + "eval_bleu_precisions": [ + 0.3914594485759182, + 0.15298104776871083, + 0.06644307749374054, + 0.028820250419342268 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228463, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 33.98047677068989, + "eval_chrf_word_order": 2, + "eval_loss": 2.066375970840454, + "eval_meteor": 0.3056258855314223, + "eval_runtime": 939.3798, + "eval_samples_per_second": 18.308, + "eval_scarebleu_bp": 0.9835429117601426, + "eval_scarebleu_counts": [ + 103025, + 38970, + 16256, + 6879 + ], + "eval_scarebleu_precisions": [ + 41.77903039396581, + 16.987794245858762, + 7.659758936228361, + 3.5249807840122984 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.572045005432432, + "eval_scarebleu_sys_len": 246595, + "eval_scarebleu_totals": [ + 246595, + 229400, + 212226, + 195150 + ], + "eval_steps_per_second": 0.573, + "eval_ter_num_edits": 156328, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.58891600914049, + "step": 185500 + }, + { + "epoch": 72.86, + "learning_rate": 3.204500592183182e-05, + "loss": 1.8329, + "step": 186000 + }, + { + "epoch": 72.86, + "eval_bleu_bleu": 0.09971306145753535, + "eval_bleu_brevity_penalty": 0.9640055645941688, + "eval_bleu_length_ratio": 0.9646380923203471, + "eval_bleu_precisions": [ + 0.39006234419389785, + 0.15272879459037517, + 0.06640033555673773, + 0.02893775356958734 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229853, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.06298079804643, + "eval_chrf_word_order": 2, + "eval_loss": 2.0665056705474854, + "eval_meteor": 0.3063966466674727, + "eval_runtime": 942.3117, + "eval_samples_per_second": 18.251, + "eval_scarebleu_bp": 0.9882637291784402, + "eval_scarebleu_counts": [ + 103210, + 39118, + 16351, + 6930 + ], + "eval_scarebleu_precisions": [ + 41.65691268233224, + 16.96600120572328, + 7.662388175807079, + 3.5300769689220783 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.620547247512635, + "eval_scarebleu_sys_len": 247762, + "eval_scarebleu_totals": [ + 247762, + 230567, + 213393, + 196313 + ], + "eval_steps_per_second": 0.571, + "eval_ter_num_edits": 156460, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.64936414967326, + "step": 186000 + }, + { + "epoch": 73.05, + "learning_rate": 3.199565732333202e-05, + "loss": 1.8269, + "step": 186500 + }, + { + "epoch": 73.05, + "eval_bleu_bleu": 0.09969490241455958, + "eval_bleu_brevity_penalty": 0.9585915775317704, + "eval_bleu_length_ratio": 0.9594257152329831, + "eval_bleu_precisions": [ + 0.3918840300772929, + 0.15355980625875051, + 0.0666646075282102, + 0.029162646081269433 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228611, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.09599541966476, + "eval_chrf_word_order": 2, + "eval_loss": 2.0683391094207764, + "eval_meteor": 0.30692710447215826, + "eval_runtime": 935.0328, + "eval_samples_per_second": 18.393, + "eval_scarebleu_bp": 0.9834942544349978, + "eval_scarebleu_counts": [ + 103138, + 39131, + 16340, + 6914 + ], + "eval_scarebleu_precisions": [ + 41.8268899315849, + 17.05886968803948, + 7.699738472775252, + 3.5431154202901523 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.61685589401894, + "eval_scarebleu_sys_len": 246583, + "eval_scarebleu_totals": [ + 246583, + 229388, + 212215, + 195139 + ], + "eval_steps_per_second": 0.575, + "eval_ter_num_edits": 156187, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.52434640448048, + "step": 186500 + }, + { + "epoch": 73.25, + "learning_rate": 3.194630872483222e-05, + "loss": 1.8021, + "step": 187000 + }, + { + "epoch": 73.25, + "eval_bleu_bleu": 0.09830035014100522, + "eval_bleu_brevity_penalty": 0.958062620279315, + "eval_bleu_length_ratio": 0.9589179071592545, + "eval_bleu_precisions": [ + 0.3916582782616307, + 0.1523746420880759, + 0.06569655136889278, + 0.028267154537651894 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228490, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.05606619046791, + "eval_chrf_word_order": 2, + "eval_loss": 2.070355176925659, + "eval_meteor": 0.30572842034885916, + "eval_runtime": 935.1351, + "eval_samples_per_second": 18.391, + "eval_scarebleu_bp": 0.9825733812624489, + "eval_scarebleu_counts": [ + 103009, + 38859, + 16103, + 6775 + ], + "eval_scarebleu_precisions": [ + 41.81306726850574, + 16.95707384764423, + 7.596148856780305, + 3.4758740989662162 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.493309589351256, + "eval_scarebleu_sys_len": 246356, + "eval_scarebleu_totals": [ + 246356, + 229161, + 211989, + 194915 + ], + "eval_steps_per_second": 0.575, + "eval_ter_num_edits": 156366, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.60631774656659, + "step": 187000 + }, + { + "epoch": 73.44, + "learning_rate": 3.1896960126332417e-05, + "loss": 1.8138, + "step": 187500 + }, + { + "epoch": 73.44, + "eval_bleu_bleu": 0.09934848826583133, + "eval_bleu_brevity_penalty": 0.9562858116675693, + "eval_bleu_length_ratio": 0.9572140222176524, + "eval_bleu_precisions": [ + 0.3922765296995844, + 0.1535357462930736, + 0.06668077572278802, + 0.029006259692335556 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228084, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.055922627417644, + "eval_chrf_word_order": 2, + "eval_loss": 2.067139148712158, + "eval_meteor": 0.3062189187427121, + "eval_runtime": 937.5802, + "eval_samples_per_second": 18.343, + "eval_scarebleu_bp": 0.9846897389443398, + "eval_scarebleu_counts": [ + 103302, + 39158, + 16350, + 6922 + ], + "eval_scarebleu_precisions": [ + 41.84333962524, + 17.04871496802114, + 7.693755587972331, + 3.541860679308616 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.627099115000139, + "eval_scarebleu_sys_len": 246878, + "eval_scarebleu_totals": [ + 246878, + 229683, + 212510, + 195434 + ], + "eval_steps_per_second": 0.574, + "eval_ter_num_edits": 156214, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.5367107968622, + "step": 187500 + }, + { + "epoch": 73.64, + "learning_rate": 3.1847808922226615e-05, + "loss": 1.8178, + "step": 188000 + }, + { + "epoch": 73.64, + "eval_bleu_bleu": 0.09940096932759748, + "eval_bleu_brevity_penalty": 0.9661077445263203, + "eval_bleu_length_ratio": 0.9666693246152619, + "eval_bleu_precisions": [ + 0.38963779158363615, + 0.15235382984113877, + 0.06590569301499666, + 0.028643286293139582 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230337, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.04596610395175, + "eval_chrf_word_order": 2, + "eval_loss": 2.065434455871582, + "eval_meteor": 0.3058162109741586, + "eval_runtime": 933.8491, + "eval_samples_per_second": 18.416, + "eval_scarebleu_bp": 0.9910929348545177, + "eval_scarebleu_counts": [ + 103448, + 39136, + 16292, + 6892 + ], + "eval_scarebleu_precisions": [ + 41.63500547362998, + 16.922285304126365, + 7.6097770595021785, + 3.4982995787015887 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.598478527143604, + "eval_scarebleu_sys_len": 248464, + "eval_scarebleu_totals": [ + 248464, + 231269, + 214093, + 197010 + ], + "eval_steps_per_second": 0.576, + "eval_ter_num_edits": 156631, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.72767196809072, + "step": 188000 + }, + { + "epoch": 73.83, + "learning_rate": 3.179846032372681e-05, + "loss": 1.8214, + "step": 188500 + }, + { + "epoch": 73.83, + "eval_bleu_bleu": 0.09934271340301296, + "eval_bleu_brevity_penalty": 0.9623433924275707, + "eval_bleu_length_ratio": 0.9630349296413029, + "eval_bleu_precisions": [ + 0.3907073224939099, + 0.15308372119316363, + 0.06620266204712141, + 0.02867924952126375 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229471, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.14768271984729, + "eval_chrf_word_order": 2, + "eval_loss": 2.0671374797821045, + "eval_meteor": 0.3073604531467471, + "eval_runtime": 938.8638, + "eval_samples_per_second": 18.318, + "eval_scarebleu_bp": 0.9896511104017215, + "eval_scarebleu_counts": [ + 103432, + 39292, + 16362, + 6885 + ], + "eval_scarebleu_precisions": [ + 41.68863308424625, + 17.01607978831671, + 7.655202421667751, + 3.500948332409578 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.620826135483538, + "eval_scarebleu_sys_len": 248106, + "eval_scarebleu_totals": [ + 248106, + 230911, + 213737, + 196661 + ], + "eval_steps_per_second": 0.573, + "eval_ter_num_edits": 156342, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.59532717556063, + "step": 188500 + }, + { + "epoch": 74.03, + "learning_rate": 3.1749111725227e-05, + "loss": 1.837, + "step": 189000 + }, + { + "epoch": 74.03, + "eval_bleu_bleu": 0.09915605357994811, + "eval_bleu_brevity_penalty": 0.9599280752221349, + "eval_bleu_length_ratio": 0.9607099240805946, + "eval_bleu_precisions": [ + 0.3920591306019212, + 0.1530119685247636, + 0.06609752211388716, + 0.028711772559048686 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228917, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.069089634705435, + "eval_chrf_word_order": 2, + "eval_loss": 2.0624337196350098, + "eval_meteor": 0.3068972878340172, + "eval_runtime": 915.0454, + "eval_samples_per_second": 18.795, + "eval_scarebleu_bp": 0.9873552548191804, + "eval_scarebleu_counts": [ + 103533, + 39137, + 16259, + 6864 + ], + "eval_scarebleu_precisions": [ + 41.82526248601219, + 16.99082234242995, + 7.6272816403886115, + 3.5003263707571803 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.58794142254493, + "eval_scarebleu_sys_len": 247537, + "eval_scarebleu_totals": [ + 247537, + 230342, + 213169, + 196096 + ], + "eval_steps_per_second": 0.588, + "eval_ter_num_edits": 156171, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.51701935714318, + "step": 189000 + }, + { + "epoch": 74.23, + "learning_rate": 3.16997631267272e-05, + "loss": 1.7974, + "step": 189500 + }, + { + "epoch": 74.23, + "eval_bleu_bleu": 0.09956115725023415, + "eval_bleu_brevity_penalty": 0.9607963164560454, + "eval_bleu_length_ratio": 0.961545079507636, + "eval_bleu_precisions": [ + 0.39125595768082544, + 0.15331184733933872, + 0.0664099404395153, + 0.028944406932252982 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229116, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.08872057981793, + "eval_chrf_word_order": 2, + "eval_loss": 2.066352605819702, + "eval_meteor": 0.3065616582326905, + "eval_runtime": 1043.9771, + "eval_samples_per_second": 16.474, + "eval_scarebleu_bp": 0.987379491383863, + "eval_scarebleu_counts": [ + 103375, + 39227, + 16366, + 6928 + ], + "eval_scarebleu_precisions": [ + 41.76042142173279, + 17.029451091392154, + 7.677260466752668, + 3.5328373354818643 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.636113856871809, + "eval_scarebleu_sys_len": 247543, + "eval_scarebleu_totals": [ + 247543, + 230348, + 213175, + 196103 + ], + "eval_steps_per_second": 0.515, + "eval_ter_num_edits": 156342, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.59532717556063, + "step": 189500 + }, + { + "epoch": 74.42, + "learning_rate": 3.16504145282274e-05, + "loss": 1.8111, + "step": 190000 + }, + { + "epoch": 74.42, + "eval_bleu_bleu": 0.09926128748954138, + "eval_bleu_brevity_penalty": 0.9638272913665158, + "eval_bleu_length_ratio": 0.964466025121811, + "eval_bleu_precisions": [ + 0.3907193706159818, + 0.15280527897581098, + 0.06614754140296843, + 0.028484311769255775 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229812, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.14526089426623, + "eval_chrf_word_order": 2, + "eval_loss": 2.066035509109497, + "eval_meteor": 0.307318531321858, + "eval_runtime": 1056.2446, + "eval_samples_per_second": 16.282, + "eval_scarebleu_bp": 0.9901225476848173, + "eval_scarebleu_counts": [ + 103517, + 39214, + 16318, + 6855 + ], + "eval_scarebleu_precisions": [ + 41.70322653420513, + 16.97370015755666, + 7.6304037782609715, + 3.483656543480912 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.596347183475316, + "eval_scarebleu_sys_len": 248223, + "eval_scarebleu_totals": [ + 248223, + 231028, + 213855, + 196776 + ], + "eval_steps_per_second": 0.509, + "eval_ter_num_edits": 156315, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.58296278317893, + "step": 190000 + }, + { + "epoch": 74.62, + "learning_rate": 3.16010659297276e-05, + "loss": 1.8102, + "step": 190500 + }, + { + "epoch": 74.62, + "eval_bleu_bleu": 0.09925053299985517, + "eval_bleu_brevity_penalty": 0.9593779601385177, + "eval_bleu_length_ratio": 0.9601811322021664, + "eval_bleu_precisions": [ + 0.39213955094387454, + 0.1533110266734721, + 0.06632618948429536, + 0.028725880913861815 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228791, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.14691917790121, + "eval_chrf_word_order": 2, + "eval_loss": 2.060333728790283, + "eval_meteor": 0.30736448675815903, + "eval_runtime": 1045.9428, + "eval_samples_per_second": 16.443, + "eval_scarebleu_bp": 0.9840496204630725, + "eval_scarebleu_counts": [ + 103313, + 39089, + 16249, + 6812 + ], + "eval_scarebleu_precisions": [ + 41.87459468223087, + 17.03038884653088, + 7.6519536051160575, + 3.488270868431968 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.558631696188748, + "eval_scarebleu_sys_len": 246720, + "eval_scarebleu_totals": [ + 246720, + 229525, + 212351, + 195283 + ], + "eval_steps_per_second": 0.514, + "eval_ter_num_edits": 156192, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.5266361067734, + "step": 190500 + }, + { + "epoch": 74.81, + "learning_rate": 3.1551717331227794e-05, + "loss": 1.8215, + "step": 191000 + }, + { + "epoch": 74.81, + "eval_bleu_bleu": 0.09963667836680133, + "eval_bleu_brevity_penalty": 0.9585041650762318, + "eval_bleu_length_ratio": 0.959341780014185, + "eval_bleu_precisions": [ + 0.391865821489035, + 0.15348918617192378, + 0.06672844749916339, + 0.029092078827964513 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228591, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.12472757255265, + "eval_chrf_word_order": 2, + "eval_loss": 2.0610358715057373, + "eval_meteor": 0.3066651692815991, + "eval_runtime": 1060.2059, + "eval_samples_per_second": 16.221, + "eval_scarebleu_bp": 0.9832387652725239, + "eval_scarebleu_counts": [ + 103124, + 39127, + 16350, + 6933 + ], + "eval_scarebleu_precisions": [ + 41.83190004867759, + 17.06181183909299, + 7.706738564802595, + 3.553908376520522 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.626162558263655, + "eval_scarebleu_sys_len": 246520, + "eval_scarebleu_totals": [ + 246520, + 229325, + 212152, + 195081 + ], + "eval_steps_per_second": 0.507, + "eval_ter_num_edits": 156259, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.55731811749835, + "step": 191000 + }, + { + "epoch": 75.01, + "learning_rate": 3.1502368732728e-05, + "loss": 1.8072, + "step": 191500 + }, + { + "epoch": 75.01, + "eval_bleu_bleu": 0.09969100927753802, + "eval_bleu_brevity_penalty": 0.9618860462332512, + "eval_bleu_length_ratio": 0.9625942697426126, + "eval_bleu_precisions": [ + 0.39168403337896635, + 0.15354596056954062, + 0.06643829996718083, + 0.028875977703856873 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229366, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.23342883383066, + "eval_chrf_word_order": 2, + "eval_loss": 2.061901807785034, + "eval_meteor": 0.3081527016964595, + "eval_runtime": 1096.3539, + "eval_samples_per_second": 15.687, + "eval_scarebleu_bp": 0.9879004372635075, + "eval_scarebleu_counts": [ + 103519, + 39354, + 16402, + 6906 + ], + "eval_scarebleu_precisions": [ + 41.79681191252948, + 17.075022670374917, + 7.689566905139192, + 3.5193754204292964 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.646117252572495, + "eval_scarebleu_sys_len": 247672, + "eval_scarebleu_totals": [ + 247672, + 230477, + 213302, + 196228 + ], + "eval_steps_per_second": 0.491, + "eval_ter_num_edits": 156276, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.56510310529424, + "step": 191500 + }, + { + "epoch": 75.21, + "learning_rate": 3.145311883142519e-05, + "loss": 1.7871, + "step": 192000 + }, + { + "epoch": 75.21, + "eval_bleu_bleu": 0.09994747113507425, + "eval_bleu_brevity_penalty": 0.9630050990758918, + "eval_bleu_length_ratio": 0.9636728373041686, + "eval_bleu_precisions": [ + 0.39281343767828136, + 0.15384036002786827, + 0.06649937264742785, + 0.028873452807110074 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229623, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.15778377640217, + "eval_chrf_word_order": 2, + "eval_loss": 2.0622265338897705, + "eval_meteor": 0.30856366851498174, + "eval_runtime": 1061.2217, + "eval_samples_per_second": 16.206, + "eval_scarebleu_bp": 0.9890544471350722, + "eval_scarebleu_counts": [ + 103860, + 39415, + 16421, + 6914 + ], + "eval_scarebleu_precisions": [ + 41.88612587615645, + 17.080294501284868, + 7.6881300066951015, + 3.5183243941907447 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.665429587063937, + "eval_scarebleu_sys_len": 247958, + "eval_scarebleu_totals": [ + 247958, + 230763, + 213589, + 196514 + ], + "eval_steps_per_second": 0.507, + "eval_ter_num_edits": 156020, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.44787034789736, + "step": 192000 + }, + { + "epoch": 75.4, + "learning_rate": 3.140377023292539e-05, + "loss": 1.7974, + "step": 192500 + }, + { + "epoch": 75.4, + "eval_bleu_bleu": 0.09992002640479987, + "eval_bleu_brevity_penalty": 0.9596530539807011, + "eval_bleu_length_ratio": 0.9604455281413805, + "eval_bleu_precisions": [ + 0.39185681700997144, + 0.15353941953803052, + 0.06681885488647582, + 0.029235251356666686 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228854, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.13103338067553, + "eval_chrf_word_order": 2, + "eval_loss": 2.061849594116211, + "eval_meteor": 0.30709480458393884, + "eval_runtime": 1083.1629, + "eval_samples_per_second": 15.878, + "eval_scarebleu_bp": 0.9830318936939101, + "eval_scarebleu_counts": [ + 103132, + 39107, + 16329, + 6936 + ], + "eval_scarebleu_precisions": [ + 41.84380185743441, + 17.056883903102836, + 7.698727015558699, + 3.556430648064114 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.622742927881783, + "eval_scarebleu_sys_len": 246469, + "eval_scarebleu_totals": [ + 246469, + 229274, + 212100, + 195027 + ], + "eval_steps_per_second": 0.497, + "eval_ter_num_edits": 156165, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.5142717143917, + "step": 192500 + }, + { + "epoch": 75.6, + "learning_rate": 3.135452033162258e-05, + "loss": 1.8077, + "step": 193000 + }, + { + "epoch": 75.6, + "eval_bleu_bleu": 0.100228179579133, + "eval_bleu_brevity_penalty": 0.9615897527488527, + "eval_bleu_length_ratio": 0.962308889998699, + "eval_bleu_precisions": [ + 0.39161702239007756, + 0.15390635681720674, + 0.06705071251962122, + 0.029206434858858047 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229298, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.17167544811584, + "eval_chrf_word_order": 2, + "eval_loss": 2.0615789890289307, + "eval_meteor": 0.3074877008847816, + "eval_runtime": 1099.8001, + "eval_samples_per_second": 15.637, + "eval_scarebleu_bp": 0.9867491521681152, + "eval_scarebleu_counts": [ + 103427, + 39359, + 16447, + 6973 + ], + "eval_scarebleu_precisions": [ + 41.80777486286668, + 17.09833530270383, + 7.720907524680897, + 3.5585971788433666 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.68143718399606, + "eval_scarebleu_sys_len": 247387, + "eval_scarebleu_totals": [ + 247387, + 230192, + 213019, + 195948 + ], + "eval_steps_per_second": 0.489, + "eval_ter_num_edits": 156214, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.5367107968622, + "step": 193000 + }, + { + "epoch": 75.79, + "learning_rate": 3.130517173312278e-05, + "loss": 1.8054, + "step": 193500 + }, + { + "epoch": 75.79, + "eval_bleu_bleu": 0.10032256690154161, + "eval_bleu_brevity_penalty": 0.9608966192822939, + "eval_bleu_length_ratio": 0.9616416050092539, + "eval_bleu_precisions": [ + 0.39105521102911334, + 0.15370569584418525, + 0.06723344833251191, + 0.029401836348906293 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229139, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.16668047374577, + "eval_chrf_word_order": 2, + "eval_loss": 2.059645891189575, + "eval_meteor": 0.30711795218655463, + "eval_runtime": 1098.6482, + "eval_samples_per_second": 15.654, + "eval_scarebleu_bp": 0.9851432495816728, + "eval_scarebleu_counts": [ + 103172, + 39199, + 16498, + 7019 + ], + "eval_scarebleu_precisions": [ + 41.771731649054615, + 17.058247568484955, + 7.759273455834975, + 3.589436756568787 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.692717302982155, + "eval_scarebleu_sys_len": 246990, + "eval_scarebleu_totals": [ + 246990, + 229795, + 212623, + 195546 + ], + "eval_steps_per_second": 0.49, + "eval_ter_num_edits": 156399, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.62142978169979, + "step": 193500 + }, + { + "epoch": 75.99, + "learning_rate": 3.125582313462298e-05, + "loss": 1.8155, + "step": 194000 + }, + { + "epoch": 75.99, + "eval_bleu_bleu": 0.10009301821140741, + "eval_bleu_brevity_penalty": 0.9616071841145288, + "eval_bleu_length_ratio": 0.9623256770424586, + "eval_bleu_precisions": [ + 0.39125258392861817, + 0.15353571546436467, + 0.06679285545740872, + 0.029256858920672035 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229302, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.19595478809996, + "eval_chrf_word_order": 2, + "eval_loss": 2.058773994445801, + "eval_meteor": 0.307208705183779, + "eval_runtime": 1098.3136, + "eval_samples_per_second": 15.659, + "eval_scarebleu_bp": 0.9890947733167788, + "eval_scarebleu_counts": [ + 103475, + 39364, + 16491, + 7036 + ], + "eval_scarebleu_precisions": [ + 41.72917473222351, + 17.05745472823944, + 7.720469473457522, + 3.580169645901072 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.714216377451484, + "eval_scarebleu_sys_len": 247968, + "eval_scarebleu_totals": [ + 247968, + 230773, + 213601, + 196527 + ], + "eval_steps_per_second": 0.49, + "eval_ter_num_edits": 156363, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.60494392519084, + "step": 194000 + }, + { + "epoch": 76.18, + "learning_rate": 3.120647453612318e-05, + "loss": 1.7885, + "step": 194500 + }, + { + "epoch": 76.18, + "eval_bleu_bleu": 0.10007139901674392, + "eval_bleu_brevity_penalty": 0.9636315903635873, + "eval_bleu_length_ratio": 0.9642771708795151, + "eval_bleu_precisions": [ + 0.3913573315576214, + 0.15355267862183167, + 0.06664449107005782, + 0.029040269547521206 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229767, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.25679388130214, + "eval_chrf_word_order": 2, + "eval_loss": 2.0593748092651367, + "eval_meteor": 0.3079161334349175, + "eval_runtime": 1099.8967, + "eval_samples_per_second": 15.636, + "eval_scarebleu_bp": 0.9875975943683966, + "eval_scarebleu_counts": [ + 103506, + 39287, + 16406, + 6936 + ], + "eval_scarebleu_precisions": [ + 41.804222183629044, + 17.05150128905131, + 7.694075383742361, + 3.5359431475807646 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.6544328370353, + "eval_scarebleu_sys_len": 247597, + "eval_scarebleu_totals": [ + 247597, + 230402, + 213229, + 196157 + ], + "eval_steps_per_second": 0.489, + "eval_ter_num_edits": 156265, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.56006576024984, + "step": 194500 + }, + { + "epoch": 76.38, + "learning_rate": 3.1157125937623374e-05, + "loss": 1.7927, + "step": 195000 + }, + { + "epoch": 76.38, + "eval_bleu_bleu": 0.10021778523913702, + "eval_bleu_brevity_penalty": 0.9620994994997717, + "eval_bleu_length_ratio": 0.962799911028668, + "eval_bleu_precisions": [ + 0.39097269141076213, + 0.15355762887569505, + 0.0668266199111029, + 0.02934485257357278 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229415, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.18551544473243, + "eval_chrf_word_order": 2, + "eval_loss": 2.060504198074341, + "eval_meteor": 0.30729520318300574, + "eval_runtime": 1085.7682, + "eval_samples_per_second": 15.839, + "eval_scarebleu_bp": 0.9889657238734362, + "eval_scarebleu_counts": [ + 103461, + 39327, + 16465, + 7014 + ], + "eval_scarebleu_precisions": [ + 41.72891391326794, + 17.043785023034484, + 7.709524411542982, + 3.569538311212442 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.69746975564498, + "eval_scarebleu_sys_len": 247936, + "eval_scarebleu_totals": [ + 247936, + 230741, + 213567, + 196496 + ], + "eval_steps_per_second": 0.496, + "eval_ter_num_edits": 156253, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.55457047474687, + "step": 195000 + }, + { + "epoch": 76.58, + "learning_rate": 3.110777733912357e-05, + "loss": 1.799, + "step": 195500 + }, + { + "epoch": 76.58, + "eval_bleu_bleu": 0.10043147057658337, + "eval_bleu_brevity_penalty": 0.9635924457338001, + "eval_bleu_length_ratio": 0.964239400031056, + "eval_bleu_precisions": [ + 0.39182095944428486, + 0.1537520640939392, + 0.06695427887125004, + 0.029256258585405513 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229758, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.2462427621209, + "eval_chrf_word_order": 2, + "eval_loss": 2.0579581260681152, + "eval_meteor": 0.30822428151732867, + "eval_runtime": 1049.2889, + "eval_samples_per_second": 16.39, + "eval_scarebleu_bp": 0.9872825416450992, + "eval_scarebleu_counts": [ + 103531, + 39335, + 16474, + 6980 + ], + "eval_scarebleu_precisions": [ + 41.82749607100869, + 17.07811604522325, + 7.728793202940638, + 3.5598986091914746 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.689723617848172, + "eval_scarebleu_sys_len": 247519, + "eval_scarebleu_totals": [ + 247519, + 230324, + 213151, + 196073 + ], + "eval_steps_per_second": 0.513, + "eval_ter_num_edits": 156172, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.51747729760176, + "step": 195500 + }, + { + "epoch": 76.77, + "learning_rate": 3.1058428740623766e-05, + "loss": 1.7901, + "step": 196000 + }, + { + "epoch": 76.77, + "eval_bleu_bleu": 0.10040682674102325, + "eval_bleu_brevity_penalty": 0.9608093999815734, + "eval_bleu_length_ratio": 0.9615576697904558, + "eval_bleu_precisions": [ + 0.391735299124036, + 0.15405994601838394, + 0.06713835347757777, + 0.029434106651511655 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229119, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.25395725723878, + "eval_chrf_word_order": 2, + "eval_loss": 2.0584189891815186, + "eval_meteor": 0.30757907321440364, + "eval_runtime": 1089.447, + "eval_samples_per_second": 15.786, + "eval_scarebleu_bp": 0.9851756354478926, + "eval_scarebleu_counts": [ + 103302, + 39328, + 16490, + 7011 + ], + "eval_scarebleu_precisions": [ + 41.82301071263735, + 17.113788766900345, + 7.755255608333726, + 3.58519897317365 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.701226141728272, + "eval_scarebleu_sys_len": 246998, + "eval_scarebleu_totals": [ + 246998, + 229803, + 212630, + 195554 + ], + "eval_steps_per_second": 0.494, + "eval_ter_num_edits": 156050, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.46160856165481, + "step": 196000 + }, + { + "epoch": 76.97, + "learning_rate": 3.100908014212396e-05, + "loss": 1.8056, + "step": 196500 + }, + { + "epoch": 76.97, + "eval_bleu_bleu": 0.10004842802060726, + "eval_bleu_brevity_penalty": 0.9579620443561749, + "eval_bleu_length_ratio": 0.9588213816576366, + "eval_bleu_precisions": [ + 0.39342662178782933, + 0.15424192510129123, + 0.06699259701923127, + 0.029265427601669405 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228467, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.18408901407534, + "eval_chrf_word_order": 2, + "eval_loss": 2.05129337310791, + "eval_meteor": 0.3079807739559082, + "eval_runtime": 1096.4512, + "eval_samples_per_second": 15.685, + "eval_scarebleu_bp": 0.9821674456846616, + "eval_scarebleu_counts": [ + 103440, + 39267, + 16409, + 6958 + ], + "eval_scarebleu_precisions": [ + 42.005067896822815, + 17.142595203897653, + 7.744149059177211, + 3.5715935631239892 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.667801560347197, + "eval_scarebleu_sys_len": 246256, + "eval_scarebleu_totals": [ + 246256, + 229061, + 211889, + 194815 + ], + "eval_steps_per_second": 0.491, + "eval_ter_num_edits": 155946, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.41398275396233, + "step": 196500 + }, + { + "epoch": 77.16, + "learning_rate": 3.095983024082117e-05, + "loss": 1.7814, + "step": 197000 + }, + { + "epoch": 77.16, + "eval_bleu_bleu": 0.10091984243392385, + "eval_bleu_brevity_penalty": 0.9623085540847977, + "eval_bleu_length_ratio": 0.9630013555537836, + "eval_bleu_precisions": [ + 0.3922026644818555, + 0.15462057399136941, + 0.06736816208541979, + 0.029608496155725413 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229463, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.26133019201357, + "eval_chrf_word_order": 2, + "eval_loss": 2.056267261505127, + "eval_meteor": 0.3085028819053107, + "eval_runtime": 1074.6606, + "eval_samples_per_second": 16.003, + "eval_scarebleu_bp": 0.9895624394988061, + "eval_scarebleu_counts": [ + 103821, + 39649, + 16643, + 7097 + ], + "eval_scarebleu_precisions": [ + 41.84913174569904, + 17.172320898786865, + 7.787401095841697, + 3.609206859374682 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.79704249835883, + "eval_scarebleu_sys_len": 248084, + "eval_scarebleu_totals": [ + 248084, + 230889, + 213717, + 196636 + ], + "eval_steps_per_second": 0.501, + "eval_ter_num_edits": 155982, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.43046861047127, + "step": 197000 + }, + { + "epoch": 77.36, + "learning_rate": 3.091048164232136e-05, + "loss": 1.7836, + "step": 197500 + }, + { + "epoch": 77.36, + "eval_bleu_bleu": 0.10025328820409289, + "eval_bleu_brevity_penalty": 0.9605389736957658, + "eval_bleu_length_ratio": 0.9612974706121815, + "eval_bleu_precisions": [ + 0.39243943647214447, + 0.15418999159830454, + 0.06701592193117617, + 0.029263597525624643 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229057, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.28300096185606, + "eval_chrf_word_order": 2, + "eval_loss": 2.054814577102661, + "eval_meteor": 0.30840383990065334, + "eval_runtime": 1098.2442, + "eval_samples_per_second": 15.66, + "eval_scarebleu_bp": 0.9863934031468995, + "eval_scarebleu_counts": [ + 103594, + 39389, + 16454, + 6980 + ], + "eval_scarebleu_precisions": [ + 41.89018152115455, + 17.117911900705767, + 7.727422157516555, + 3.5637882354142523 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.693043048784567, + "eval_scarebleu_sys_len": 247299, + "eval_scarebleu_totals": [ + 247299, + 230104, + 212930, + 195859 + ], + "eval_steps_per_second": 0.49, + "eval_ter_num_edits": 155989, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.43367419368134, + "step": 197500 + }, + { + "epoch": 77.56, + "learning_rate": 3.086113304382155e-05, + "loss": 1.7908, + "step": 198000 + }, + { + "epoch": 77.56, + "eval_bleu_bleu": 0.10106615808361132, + "eval_bleu_brevity_penalty": 0.9578439646028161, + "eval_bleu_length_ratio": 0.9587080691122591, + "eval_bleu_precisions": [ + 0.3929259324111364, + 0.15475869251343227, + 0.06792419777003772, + 0.030009150164364062 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228440, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.228151370887325, + "eval_chrf_word_order": 2, + "eval_loss": 2.0554449558258057, + "eval_meteor": 0.30758583022036573, + "eval_runtime": 1108.2631, + "eval_samples_per_second": 15.518, + "eval_scarebleu_bp": 0.9823217202737443, + "eval_scarebleu_counts": [ + 103374, + 39366, + 16590, + 7113 + ], + "eval_scarebleu_precisions": [ + 41.97178981217569, + 17.182964569902094, + 7.828204184479488, + 3.650444180997983 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.769814201737642, + "eval_scarebleu_sys_len": 246294, + "eval_scarebleu_totals": [ + 246294, + 229099, + 211926, + 194853 + ], + "eval_steps_per_second": 0.485, + "eval_ter_num_edits": 155988, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.43321625322275, + "step": 198000 + }, + { + "epoch": 77.75, + "learning_rate": 3.0811784445321756e-05, + "loss": 1.7915, + "step": 198500 + }, + { + "epoch": 77.75, + "eval_bleu_bleu": 0.1011977120825175, + "eval_bleu_brevity_penalty": 0.964435902948255, + "eval_bleu_length_ratio": 0.9650535716533979, + "eval_bleu_precisions": [ + 0.39229056498747567, + 0.15456600722890435, + 0.06758318166015664, + 0.029582087211711863 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229952, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.31213429062529, + "eval_chrf_word_order": 2, + "eval_loss": 2.052584648132324, + "eval_meteor": 0.309152746469292, + "eval_runtime": 1090.1051, + "eval_samples_per_second": 15.776, + "eval_scarebleu_bp": 0.989139130258955, + "eval_scarebleu_counts": [ + 103810, + 39596, + 16658, + 7094 + ], + "eval_scarebleu_precisions": [ + 41.862415769077224, + 17.157168607875764, + 7.798287541371933, + 3.609535197293103 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.79471607062925, + "eval_scarebleu_sys_len": 247979, + "eval_scarebleu_totals": [ + 247979, + 230784, + 213611, + 196535 + ], + "eval_steps_per_second": 0.494, + "eval_ter_num_edits": 155894, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.3901698501161, + "step": 198500 + }, + { + "epoch": 77.95, + "learning_rate": 3.0762534544018954e-05, + "loss": 1.7915, + "step": 199000 + }, + { + "epoch": 77.95, + "eval_bleu_bleu": 0.10081001949537771, + "eval_bleu_brevity_penalty": 0.9580844833281916, + "eval_bleu_length_ratio": 0.958938890963954, + "eval_bleu_precisions": [ + 0.39312895249349, + 0.1550970184571699, + 0.06767351059555574, + 0.029705877370795525 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228495, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.290781392629945, + "eval_chrf_word_order": 2, + "eval_loss": 2.0529062747955322, + "eval_meteor": 0.30843950984636703, + "eval_runtime": 1108.3098, + "eval_samples_per_second": 15.517, + "eval_scarebleu_bp": 0.9856127435245098, + "eval_scarebleu_counts": [ + 103605, + 39534, + 16605, + 7081 + ], + "eval_scarebleu_precisions": [ + 41.927351015353736, + 17.195349504808384, + 7.805412316616292, + 3.618866555254026 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.774040426340019, + "eval_scarebleu_sys_len": 247106, + "eval_scarebleu_totals": [ + 247106, + 229911, + 212737, + 195669 + ], + "eval_steps_per_second": 0.485, + "eval_ter_num_edits": 155896, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.39108573103326, + "step": 199000 + }, + { + "epoch": 78.14, + "learning_rate": 3.0713185945519143e-05, + "loss": 1.7688, + "step": 199500 + }, + { + "epoch": 78.14, + "eval_bleu_bleu": 0.10135551399253506, + "eval_bleu_brevity_penalty": 0.9610230742862015, + "eval_bleu_length_ratio": 0.9617633110765111, + "eval_bleu_precisions": [ + 0.3931700761013754, + 0.15535469139937633, + 0.06796704565870185, + 0.029802386215974485 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229168, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.33996694754644, + "eval_chrf_word_order": 2, + "eval_loss": 2.0575571060180664, + "eval_meteor": 0.3094906602219306, + "eval_runtime": 1105.9376, + "eval_samples_per_second": 15.551, + "eval_scarebleu_bp": 0.9847504887249178, + "eval_scarebleu_counts": [ + 103615, + 39563, + 16630, + 7075 + ], + "eval_scarebleu_precisions": [ + 41.96757299720932, + 17.22392010378845, + 7.824924950359015, + 3.6198516244563828 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.779596295680266, + "eval_scarebleu_sys_len": 246893, + "eval_scarebleu_totals": [ + 246893, + 229698, + 212526, + 195450 + ], + "eval_steps_per_second": 0.486, + "eval_ter_num_edits": 155827, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.35948783939112, + "step": 199500 + }, + { + "epoch": 78.34, + "learning_rate": 3.0663837347019347e-05, + "loss": 1.7749, + "step": 200000 + }, + { + "epoch": 78.34, + "eval_bleu_bleu": 0.10095483922020422, + "eval_bleu_brevity_penalty": 0.9611495139250277, + "eval_bleu_length_ratio": 0.9618850171437684, + "eval_bleu_precisions": [ + 0.3927145643267582, + 0.15498910387637851, + 0.06755730284025005, + 0.02960017547510447 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229197, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.34273184535744, + "eval_chrf_word_order": 2, + "eval_loss": 2.056079864501953, + "eval_meteor": 0.30853922355725355, + "eval_runtime": 1106.7408, + "eval_samples_per_second": 15.539, + "eval_scarebleu_bp": 0.9844304990452454, + "eval_scarebleu_counts": [ + 103521, + 39507, + 16553, + 7035 + ], + "eval_scarebleu_precisions": [ + 41.94292057986986, + 17.205457736511352, + 7.791590373128357, + 3.600749324379658 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.74278299225465, + "eval_scarebleu_sys_len": 246814, + "eval_scarebleu_totals": [ + 246814, + 229619, + 212447, + 195376 + ], + "eval_steps_per_second": 0.486, + "eval_ter_num_edits": 155936, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.4094033493765, + "step": 200000 + }, + { + "epoch": 78.54, + "learning_rate": 3.061448874851954e-05, + "loss": 1.7765, + "step": 200500 + }, + { + "epoch": 78.54, + "eval_bleu_bleu": 0.10154919950662648, + "eval_bleu_brevity_penalty": 0.9636663843505586, + "eval_bleu_length_ratio": 0.9643107449670344, + "eval_bleu_precisions": [ + 0.391979109998912, + 0.1548264182895851, + 0.06776790146200178, + 0.02998245230446653 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229775, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.40100043198402, + "eval_chrf_word_order": 2, + "eval_loss": 2.0549123287200928, + "eval_meteor": 0.3092642693664347, + "eval_runtime": 1093.1524, + "eval_samples_per_second": 15.732, + "eval_scarebleu_bp": 0.9878842879292329, + "eval_scarebleu_counts": [ + 103621, + 39647, + 16690, + 7148 + ], + "eval_scarebleu_precisions": [ + 41.83867112424698, + 17.20244887687495, + 7.824660103141116, + 3.6428312973636867 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.822906436741418, + "eval_scarebleu_sys_len": 247668, + "eval_scarebleu_totals": [ + 247668, + 230473, + 213300, + 196221 + ], + "eval_steps_per_second": 0.492, + "eval_ter_num_edits": 156025, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.45016005019028, + "step": 200500 + }, + { + "epoch": 78.73, + "learning_rate": 3.056523884721674e-05, + "loss": 1.7884, + "step": 201000 + }, + { + "epoch": 78.73, + "eval_bleu_bleu": 0.10119201859551542, + "eval_bleu_brevity_penalty": 0.9653394666902985, + "eval_bleu_length_ratio": 0.9659264979288985, + "eval_bleu_precisions": [ + 0.392005561348627, + 0.15463104265959196, + 0.06737349594492452, + 0.02956560655645996 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230160, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.38481170699987, + "eval_chrf_word_order": 2, + "eval_loss": 2.049964189529419, + "eval_meteor": 0.30943749584921787, + "eval_runtime": 1105.7877, + "eval_samples_per_second": 15.553, + "eval_scarebleu_bp": 0.9908111757754131, + "eval_scarebleu_counts": [ + 103900, + 39749, + 16663, + 7106 + ], + "eval_scarebleu_precisions": [ + 41.82870761773634, + 17.192548410676515, + 7.785502695934139, + 3.6081139404402243 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.812349761708242, + "eval_scarebleu_sys_len": 248394, + "eval_scarebleu_totals": [ + 248394, + 231199, + 214026, + 196945 + ], + "eval_steps_per_second": 0.487, + "eval_ter_num_edits": 155971, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.42543126542687, + "step": 201000 + }, + { + "epoch": 78.93, + "learning_rate": 3.0515890248716937e-05, + "loss": 1.7917, + "step": 201500 + }, + { + "epoch": 78.93, + "eval_bleu_bleu": 0.10131242098537344, + "eval_bleu_brevity_penalty": 0.9607832327660543, + "eval_bleu_length_ratio": 0.9615324892248163, + "eval_bleu_precisions": [ + 0.3934084927524846, + 0.1551401957360866, + 0.06781131746088796, + 0.0298730017612073 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229113, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.33969944445065, + "eval_chrf_word_order": 2, + "eval_loss": 2.04858660697937, + "eval_meteor": 0.30913630860566216, + "eval_runtime": 1068.8895, + "eval_samples_per_second": 16.09, + "eval_scarebleu_bp": 0.9873875701098717, + "eval_scarebleu_counts": [ + 103915, + 39672, + 16646, + 7108 + ], + "eval_scarebleu_precisions": [ + 41.978226181098385, + 17.222487518992835, + 7.80842480532883, + 3.6245703854038123 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.809258758416643, + "eval_scarebleu_sys_len": 247545, + "eval_scarebleu_totals": [ + 247545, + 230350, + 213180, + 196106 + ], + "eval_steps_per_second": 0.503, + "eval_ter_num_edits": 155780, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.33796463783779, + "step": 201500 + }, + { + "epoch": 79.12, + "learning_rate": 3.0466541650217133e-05, + "loss": 1.7778, + "step": 202000 + }, + { + "epoch": 79.12, + "eval_bleu_bleu": 0.1013359152889202, + "eval_bleu_brevity_penalty": 0.9597098103399095, + "eval_bleu_length_ratio": 0.9605000860335993, + "eval_bleu_precisions": [ + 0.3933070298470291, + 0.1555378132204543, + 0.06809348523484413, + 0.029841495230206624 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228867, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.38641065309454, + "eval_chrf_word_order": 2, + "eval_loss": 2.052891731262207, + "eval_meteor": 0.30931004075498486, + "eval_runtime": 1104.9635, + "eval_samples_per_second": 15.564, + "eval_scarebleu_bp": 0.9843899868336425, + "eval_scarebleu_counts": [ + 103616, + 39676, + 16707, + 7113 + ], + "eval_scarebleu_precisions": [ + 41.983112105152266, + 17.27981046039136, + 7.8644862452691635, + 3.640951878829449 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.817943579506181, + "eval_scarebleu_sys_len": 246804, + "eval_scarebleu_totals": [ + 246804, + 229609, + 212436, + 195361 + ], + "eval_steps_per_second": 0.487, + "eval_ter_num_edits": 155868, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.37826339819297, + "step": 202000 + }, + { + "epoch": 79.32, + "learning_rate": 3.0417193051717336e-05, + "loss": 1.7746, + "step": 202500 + }, + { + "epoch": 79.32, + "eval_bleu_bleu": 0.10139222548393123, + "eval_bleu_brevity_penalty": 0.961811980777054, + "eval_bleu_length_ratio": 0.9625229248066343, + "eval_bleu_precisions": [ + 0.39285106976703627, + 0.15492519584829886, + 0.06791047837860015, + 0.029879347453483862 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229349, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.40408976140816, + "eval_chrf_word_order": 2, + "eval_loss": 2.0556881427764893, + "eval_meteor": 0.3090082524177811, + "eval_runtime": 1101.6429, + "eval_samples_per_second": 15.611, + "eval_scarebleu_bp": 0.9873269780939985, + "eval_scarebleu_counts": [ + 103778, + 39669, + 16719, + 7144 + ], + "eval_scarebleu_precisions": [ + 41.92542318102856, + 17.222306640328217, + 7.8434040157628075, + 3.643373690598831 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.833283601686688, + "eval_scarebleu_sys_len": 247530, + "eval_scarebleu_totals": [ + 247530, + 230335, + 213160, + 196082 + ], + "eval_steps_per_second": 0.488, + "eval_ter_num_edits": 155868, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.37826339819297, + "step": 202500 + }, + { + "epoch": 79.51, + "learning_rate": 3.036794315041453e-05, + "loss": 1.7734, + "step": 203000 + }, + { + "epoch": 79.51, + "eval_bleu_bleu": 0.10096838528170382, + "eval_bleu_brevity_penalty": 0.959775294605579, + "eval_bleu_length_ratio": 0.9605630374476979, + "eval_bleu_precisions": [ + 0.39273949021766674, + 0.15483237043370637, + 0.0677184540883995, + 0.029743358593683975 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228882, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.31652074525891, + "eval_chrf_word_order": 2, + "eval_loss": 2.0509676933288574, + "eval_meteor": 0.3079202172629952, + "eval_runtime": 1109.0287, + "eval_samples_per_second": 15.507, + "eval_scarebleu_bp": 0.9853254066392012, + "eval_scarebleu_counts": [ + 103563, + 39503, + 16600, + 7082 + ], + "eval_scarebleu_precisions": [ + 41.92239965996721, + 17.187173686042463, + 7.805630398698435, + 3.6208024868092763 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.770516913223933, + "eval_scarebleu_sys_len": 247035, + "eval_scarebleu_totals": [ + 247035, + 229840, + 212667, + 195592 + ], + "eval_steps_per_second": 0.485, + "eval_ter_num_edits": 155909, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.3970389569948, + "step": 203000 + }, + { + "epoch": 79.71, + "learning_rate": 3.0318594551914724e-05, + "loss": 1.773, + "step": 203500 + }, + { + "epoch": 79.71, + "eval_bleu_bleu": 0.10107457422062137, + "eval_bleu_brevity_penalty": 0.9604778999725636, + "eval_bleu_length_ratio": 0.9612387159590228, + "eval_bleu_precisions": [ + 0.39327549848718363, + 0.15509705071560742, + 0.06764669625246549, + 0.029721529532955433 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229043, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.335506130133645, + "eval_chrf_word_order": 2, + "eval_loss": 2.0472068786621094, + "eval_meteor": 0.3089059497447666, + "eval_runtime": 1104.3262, + "eval_samples_per_second": 15.573, + "eval_scarebleu_bp": 0.9887519494981526, + "eval_scarebleu_counts": [ + 103982, + 39710, + 16677, + 7119 + ], + "eval_scarebleu_precisions": [ + 41.94801579777556, + 17.213725898182826, + 7.810692457204412, + 3.62400733048259 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.82234369045562, + "eval_scarebleu_sys_len": 247883, + "eval_scarebleu_totals": [ + 247883, + 230688, + 213515, + 196440 + ], + "eval_steps_per_second": 0.487, + "eval_ter_num_edits": 155828, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.35994577984971, + "step": 203500 + }, + { + "epoch": 79.91, + "learning_rate": 3.0269245953414927e-05, + "loss": 1.7733, + "step": 204000 + }, + { + "epoch": 79.91, + "eval_bleu_bleu": 0.10114144935625693, + "eval_bleu_brevity_penalty": 0.9652395921246778, + "eval_bleu_length_ratio": 0.9658299724272806, + "eval_bleu_precisions": [ + 0.3923315242659807, + 0.15458199885414808, + 0.06744235935887875, + 0.029473472196579333 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230137, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.41554073199675, + "eval_chrf_word_order": 2, + "eval_loss": 2.0497422218322754, + "eval_meteor": 0.30960631664362587, + "eval_runtime": 1112.8553, + "eval_samples_per_second": 15.454, + "eval_scarebleu_bp": 0.9877025901643492, + "eval_scarebleu_counts": [ + 103769, + 39620, + 16607, + 7061 + ], + "eval_scarebleu_precisions": [ + 41.90604265354995, + 17.194090995885915, + 7.787390682516237, + 3.599282284455953 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.77449063348636, + "eval_scarebleu_sys_len": 247623, + "eval_scarebleu_totals": [ + 247623, + 230428, + 213255, + 196178 + ], + "eval_steps_per_second": 0.483, + "eval_ter_num_edits": 155920, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.4020763020392, + "step": 204000 + }, + { + "epoch": 80.1, + "learning_rate": 3.0219897354915123e-05, + "loss": 1.7702, + "step": 204500 + }, + { + "epoch": 80.1, + "eval_bleu_bleu": 0.1021156298925608, + "eval_bleu_brevity_penalty": 0.9633357943695197, + "eval_bleu_length_ratio": 0.9639917911356015, + "eval_bleu_precisions": [ + 0.392892437494286, + 0.15565354063923503, + 0.06823347530510279, + 0.030257143658338242 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229699, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.39818741051737, + "eval_chrf_word_order": 2, + "eval_loss": 2.0484650135040283, + "eval_meteor": 0.3096106257764963, + "eval_runtime": 1099.4428, + "eval_samples_per_second": 15.642, + "eval_scarebleu_bp": 0.9871249785254594, + "eval_scarebleu_counts": [ + 103848, + 39819, + 16787, + 7222 + ], + "eval_scarebleu_precisions": [ + 41.96217876192016, + 17.291182664958637, + 7.87707871917114, + 3.683942052642318 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.890834036893752, + "eval_scarebleu_sys_len": 247480, + "eval_scarebleu_totals": [ + 247480, + 230285, + 213112, + 196040 + ], + "eval_steps_per_second": 0.489, + "eval_ter_num_edits": 155814, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.35353461342956, + "step": 204500 + }, + { + "epoch": 80.3, + "learning_rate": 3.0170647453612317e-05, + "loss": 1.7579, + "step": 205000 + }, + { + "epoch": 80.3, + "eval_bleu_bleu": 0.10103228112632041, + "eval_bleu_brevity_penalty": 0.9622214531179675, + "eval_bleu_length_ratio": 0.9629174203349855, + "eval_bleu_precisions": [ + 0.3925768055682675, + 0.15483773698692097, + 0.06754457008703854, + 0.02960387754070463 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229443, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.40057672423158, + "eval_chrf_word_order": 2, + "eval_loss": 2.054286241531372, + "eval_meteor": 0.3090049084122546, + "eval_runtime": 1114.6415, + "eval_samples_per_second": 15.429, + "eval_scarebleu_bp": 0.985997081127211, + "eval_scarebleu_counts": [ + 103686, + 39567, + 16593, + 7058 + ], + "eval_scarebleu_precisions": [ + 41.944005080885596, + 17.20259471492048, + 7.796290031574199, + 3.605379974765405 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.766609761380339, + "eval_scarebleu_sys_len": 247201, + "eval_scarebleu_totals": [ + 247201, + 230006, + 212832, + 195763 + ], + "eval_steps_per_second": 0.483, + "eval_ter_num_edits": 155983, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.43092655092985, + "step": 205000 + }, + { + "epoch": 80.49, + "learning_rate": 3.0121298855112517e-05, + "loss": 1.7609, + "step": 205500 + }, + { + "epoch": 80.49, + "eval_bleu_bleu": 0.1016102699239683, + "eval_bleu_brevity_penalty": 0.9614590081929065, + "eval_bleu_length_ratio": 0.9621829871705018, + "eval_bleu_precisions": [ + 0.39288518240661585, + 0.15542761219014206, + 0.06802009101496564, + 0.030032832598722678 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229268, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.47668541730323, + "eval_chrf_word_order": 2, + "eval_loss": 2.051790714263916, + "eval_meteor": 0.309299875481607, + "eval_runtime": 1110.6368, + "eval_samples_per_second": 15.485, + "eval_scarebleu_bp": 0.9871209381231929, + "eval_scarebleu_counts": [ + 103764, + 39762, + 16707, + 7157 + ], + "eval_scarebleu_precisions": [ + 41.92840604657365, + 17.26650570599781, + 7.839576558694764, + 3.6508227996612903 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.84320934628169, + "eval_scarebleu_sys_len": 247479, + "eval_scarebleu_totals": [ + 247479, + 230284, + 213111, + 196038 + ], + "eval_steps_per_second": 0.484, + "eval_ter_num_edits": 155759, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.32834788820757, + "step": 205500 + }, + { + "epoch": 80.69, + "learning_rate": 3.0071950256612713e-05, + "loss": 1.7676, + "step": 206000 + }, + { + "epoch": 80.69, + "eval_bleu_bleu": 0.10205920041426343, + "eval_bleu_brevity_penalty": 0.9648399975652193, + "eval_bleu_length_ratio": 0.9654438704208093, + "eval_bleu_precisions": [ + 0.39330565758873265, + 0.15528306319003993, + 0.06809273898890586, + 0.030104565504578937 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230045, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.404426766858315, + "eval_chrf_word_order": 2, + "eval_loss": 2.047302722930908, + "eval_meteor": 0.309922568568182, + "eval_runtime": 1120.5341, + "eval_samples_per_second": 15.348, + "eval_scarebleu_bp": 0.9865834209996415, + "eval_scarebleu_counts": [ + 103893, + 39735, + 16718, + 7163 + ], + "eval_scarebleu_precisions": [ + 42.00310496227956, + 17.264752271334906, + 7.8496739084502085, + 3.6564200467580728 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.850077046200802, + "eval_scarebleu_sys_len": 247346, + "eval_scarebleu_totals": [ + 247346, + 230151, + 212977, + 195902 + ], + "eval_steps_per_second": 0.48, + "eval_ter_num_edits": 155865, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.37688957681722, + "step": 206000 + }, + { + "epoch": 80.89, + "learning_rate": 3.002260165811291e-05, + "loss": 1.7747, + "step": 206500 + }, + { + "epoch": 80.89, + "eval_bleu_bleu": 0.10234918911475198, + "eval_bleu_brevity_penalty": 0.963092134365255, + "eval_bleu_length_ratio": 0.9637567725229668, + "eval_bleu_precisions": [ + 0.3934890242681031, + 0.1559911131194457, + 0.06857599328168286, + 0.030301330206515823 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229643, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.49987839318083, + "eval_chrf_word_order": 2, + "eval_loss": 2.043259620666504, + "eval_meteor": 0.31009723630391467, + "eval_runtime": 1084.5507, + "eval_samples_per_second": 15.857, + "eval_scarebleu_bp": 0.9843859355236209, + "eval_scarebleu_counts": [ + 103787, + 39808, + 16784, + 7188 + ], + "eval_scarebleu_precisions": [ + 42.052568242687485, + 17.33737500435525, + 7.900806838829943, + 3.679380013206456 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.87738650387243, + "eval_scarebleu_sys_len": 246803, + "eval_scarebleu_totals": [ + 246803, + 229608, + 212434, + 195359 + ], + "eval_steps_per_second": 0.496, + "eval_ter_num_edits": 155809, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.35124491113666, + "step": 206500 + }, + { + "epoch": 81.08, + "learning_rate": 2.9973351756810107e-05, + "loss": 1.7656, + "step": 207000 + }, + { + "epoch": 81.08, + "eval_bleu_bleu": 0.10159771902559415, + "eval_bleu_brevity_penalty": 0.9611277150834258, + "eval_bleu_length_ratio": 0.9618640333390689, + "eval_bleu_precisions": [ + 0.3934125100352543, + 0.15536068906635472, + 0.06792414093976955, + 0.0300744690424766 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229192, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.41700025541714, + "eval_chrf_word_order": 2, + "eval_loss": 2.0497632026672363, + "eval_meteor": 0.3090848557938445, + "eval_runtime": 1086.613, + "eval_samples_per_second": 15.827, + "eval_scarebleu_bp": 0.9845520259865983, + "eval_scarebleu_counts": [ + 103736, + 39669, + 16641, + 7127 + ], + "eval_scarebleu_precisions": [ + 42.024922623195216, + 17.27375255280885, + 7.831943372427944, + 3.6474086356634374 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.814777969093283, + "eval_scarebleu_sys_len": 246844, + "eval_scarebleu_totals": [ + 246844, + 229649, + 212476, + 195399 + ], + "eval_steps_per_second": 0.495, + "eval_ter_num_edits": 155752, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.3251423049975, + "step": 207000 + }, + { + "epoch": 81.28, + "learning_rate": 2.9924003158310304e-05, + "loss": 1.7501, + "step": 207500 + }, + { + "epoch": 81.28, + "eval_bleu_bleu": 0.10170787821585658, + "eval_bleu_brevity_penalty": 0.9628919422932362, + "eval_bleu_length_ratio": 0.963563721519731, + "eval_bleu_precisions": [ + 0.3928927642782789, + 0.15492791969943787, + 0.06814177422659291, + 0.03001172859251278 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229597, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.44242498687022, + "eval_chrf_word_order": 2, + "eval_loss": 2.0475826263427734, + "eval_meteor": 0.3086991422875586, + "eval_runtime": 1075.2283, + "eval_samples_per_second": 15.995, + "eval_scarebleu_bp": 0.9876945139512098, + "eval_scarebleu_counts": [ + 103905, + 39650, + 16700, + 7134 + ], + "eval_scarebleu_precisions": [ + 41.961303766643375, + 17.20725959744126, + 7.831073888761237, + 3.636530462441889 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.827418129656895, + "eval_scarebleu_sys_len": 247621, + "eval_scarebleu_totals": [ + 247621, + 230426, + 213253, + 196176 + ], + "eval_steps_per_second": 0.5, + "eval_ter_num_edits": 155848, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.36910458902133, + "step": 207500 + }, + { + "epoch": 81.47, + "learning_rate": 2.9874654559810507e-05, + "loss": 1.7597, + "step": 208000 + }, + { + "epoch": 81.47, + "eval_bleu_bleu": 0.10176635707638586, + "eval_bleu_brevity_penalty": 0.9647357301622921, + "eval_bleu_length_ratio": 0.9653431481582515, + "eval_bleu_precisions": [ + 0.39342060072775964, + 0.15520190202324904, + 0.067830566685747, + 0.029895366218236172 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230021, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.465963008468854, + "eval_chrf_word_order": 2, + "eval_loss": 2.0480470657348633, + "eval_meteor": 0.31003106269254993, + "eval_runtime": 1091.863, + "eval_samples_per_second": 15.751, + "eval_scarebleu_bp": 0.9890342834410488, + "eval_scarebleu_counts": [ + 104080, + 39811, + 16704, + 7153 + ], + "eval_scarebleu_precisions": [ + 41.975697007094084, + 17.25227294394994, + 7.820737314243443, + 3.639999796449054 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.851127480936714, + "eval_scarebleu_sys_len": 247953, + "eval_scarebleu_totals": [ + 247953, + 230758, + 213586, + 196511 + ], + "eval_steps_per_second": 0.493, + "eval_ter_num_edits": 155770, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.33338523325197, + "step": 208000 + }, + { + "epoch": 81.67, + "learning_rate": 2.98253059613107e-05, + "loss": 1.7603, + "step": 208500 + }, + { + "epoch": 81.67, + "eval_bleu_bleu": 0.10158964283732573, + "eval_bleu_brevity_penalty": 0.959906250791406, + "eval_bleu_length_ratio": 0.960688940275895, + "eval_bleu_precisions": [ + 0.3937189837142657, + 0.1556747922934861, + 0.06826896388663302, + 0.02998157839884175 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228912, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.500188933335394, + "eval_chrf_word_order": 2, + "eval_loss": 2.04895281791687, + "eval_meteor": 0.30950405295350136, + "eval_runtime": 1102.6309, + "eval_samples_per_second": 15.597, + "eval_scarebleu_bp": 0.9850096469609386, + "eval_scarebleu_counts": [ + 103801, + 39758, + 16771, + 7153 + ], + "eval_scarebleu_precisions": [ + 42.03201367039606, + 17.303992827360485, + 7.888931224099084, + 3.6585989606776055 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.85646869110364, + "eval_scarebleu_sys_len": 246957, + "eval_scarebleu_totals": [ + 246957, + 229762, + 212589, + 195512 + ], + "eval_steps_per_second": 0.488, + "eval_ter_num_edits": 155759, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.32834788820757, + "step": 208500 + }, + { + "epoch": 81.86, + "learning_rate": 2.9775957362810896e-05, + "loss": 1.7701, + "step": 209000 + }, + { + "epoch": 81.86, + "eval_bleu_bleu": 0.10180174654480657, + "eval_bleu_brevity_penalty": 0.9596705178050903, + "eval_bleu_length_ratio": 0.9604623151851401, + "eval_bleu_precisions": [ + 0.39417018413164495, + 0.1559554574961141, + 0.06833898026231228, + 0.030142513397611814 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228858, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.500483817160976, + "eval_chrf_word_order": 2, + "eval_loss": 2.046210289001465, + "eval_meteor": 0.31003384040423076, + "eval_runtime": 1090.0946, + "eval_samples_per_second": 15.777, + "eval_scarebleu_bp": 0.9858797724577286, + "eval_scarebleu_counts": [ + 103935, + 39805, + 16762, + 7158 + ], + "eval_scarebleu_precisions": [ + 42.049665819753045, + 17.308252564386873, + 7.876768654577238, + 3.657097313121714 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.863123484871595, + "eval_scarebleu_sys_len": 247172, + "eval_scarebleu_totals": [ + 247172, + 229977, + 212803, + 195729 + ], + "eval_steps_per_second": 0.494, + "eval_ter_num_edits": 155592, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.25187183162444, + "step": 209000 + }, + { + "epoch": 82.06, + "learning_rate": 2.9726707461508097e-05, + "loss": 1.7647, + "step": 209500 + }, + { + "epoch": 82.06, + "eval_bleu_bleu": 0.1022739624747015, + "eval_bleu_brevity_penalty": 0.9637011771709733, + "eval_bleu_length_ratio": 0.9643443190545536, + "eval_bleu_precisions": [ + 0.3936453088348572, + 0.15575667488287204, + 0.06841975990912161, + 0.030238307462033938 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229783, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.53485184451476, + "eval_chrf_word_order": 2, + "eval_loss": 2.0481340885162354, + "eval_meteor": 0.31036813026788423, + "eval_runtime": 1092.3118, + "eval_samples_per_second": 15.745, + "eval_scarebleu_bp": 0.9872825416450992, + "eval_scarebleu_counts": [ + 104023, + 39880, + 16837, + 7210 + ], + "eval_scarebleu_precisions": [ + 42.026268690484365, + 17.31473923690106, + 7.899132066619751, + 3.677145596605398 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.90414490224999, + "eval_scarebleu_sys_len": 247519, + "eval_scarebleu_totals": [ + 247519, + 230324, + 213150, + 196076 + ], + "eval_steps_per_second": 0.493, + "eval_ter_num_edits": 155686, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.29491823473111, + "step": 209500 + }, + { + "epoch": 82.26, + "learning_rate": 2.9677358863008293e-05, + "loss": 1.7399, + "step": 210000 + }, + { + "epoch": 82.26, + "eval_bleu_bleu": 0.10133573416005517, + "eval_bleu_brevity_penalty": 0.9649963790047894, + "eval_bleu_length_ratio": 0.9655949538146459, + "eval_bleu_precisions": [ + 0.39229662597085374, + 0.1546837274409778, + 0.06762514944360995, + 0.029633319155604305 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230081, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.506263173049554, + "eval_chrf_word_order": 2, + "eval_loss": 2.0484273433685303, + "eval_meteor": 0.30940548107061355, + "eval_runtime": 1072.1161, + "eval_samples_per_second": 16.041, + "eval_scarebleu_bp": 0.9880215490585367, + "eval_scarebleu_counts": [ + 103758, + 39645, + 16636, + 7071 + ], + "eval_scarebleu_precisions": [ + 41.888236671484286, + 17.19904384682461, + 7.7981006309355285, + 3.6028737389177623 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.78487503994148, + "eval_scarebleu_sys_len": 247702, + "eval_scarebleu_totals": [ + 247702, + 230507, + 213334, + 196260 + ], + "eval_steps_per_second": 0.502, + "eval_ter_num_edits": 155958, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.41947803946532, + "step": 210000 + }, + { + "epoch": 82.45, + "learning_rate": 2.9628010264508486e-05, + "loss": 1.7534, + "step": 210500 + }, + { + "epoch": 82.45, + "eval_bleu_bleu": 0.10156697360554999, + "eval_bleu_brevity_penalty": 0.9597272732131478, + "eval_bleu_length_ratio": 0.9605168730773589, + "eval_bleu_precisions": [ + 0.3938856386348642, + 0.15587501653470398, + 0.0682463139279031, + 0.029935936082578784 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228871, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.45291167294383, + "eval_chrf_word_order": 2, + "eval_loss": 2.0457091331481934, + "eval_meteor": 0.3096404714055695, + "eval_runtime": 1077.0141, + "eval_samples_per_second": 15.968, + "eval_scarebleu_bp": 0.9858190902356517, + "eval_scarebleu_counts": [ + 103919, + 39821, + 16769, + 7134 + ], + "eval_scarebleu_precisions": [ + 42.0457442030774, + 17.316339221262645, + 7.880576533561415, + 3.644984442139576 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.855098688758046, + "eval_scarebleu_sys_len": 247157, + "eval_scarebleu_totals": [ + 247157, + 229962, + 212789, + 195721 + ], + "eval_steps_per_second": 0.5, + "eval_ter_num_edits": 155618, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.26377828354758, + "step": 210500 + }, + { + "epoch": 82.65, + "learning_rate": 2.957866166600869e-05, + "loss": 1.7507, + "step": 211000 + }, + { + "epoch": 82.65, + "eval_bleu_bleu": 0.10233276358477074, + "eval_bleu_brevity_penalty": 0.9605127996816428, + "eval_bleu_length_ratio": 0.9612722900465421, + "eval_bleu_precisions": [ + 0.39411746728894437, + 0.15625708028094554, + 0.0687742366265184, + 0.03041970638566153 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229051, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.504494106049826, + "eval_chrf_word_order": 2, + "eval_loss": 2.0427370071411133, + "eval_meteor": 0.3103389944419855, + "eval_runtime": 1024.9361, + "eval_samples_per_second": 16.78, + "eval_scarebleu_bp": 0.9868461529608409, + "eval_scarebleu_counts": [ + 103997, + 39913, + 16888, + 7238 + ], + "eval_scarebleu_precisions": [ + 42.03410519338267, + 17.33719637210272, + 7.927038203555151, + 3.6935166994106092 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.927031760660647, + "eval_scarebleu_sys_len": 247411, + "eval_scarebleu_totals": [ + 247411, + 230216, + 213043, + 195965 + ], + "eval_steps_per_second": 0.525, + "eval_ter_num_edits": 155649, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.2779744377636, + "step": 211000 + }, + { + "epoch": 82.84, + "learning_rate": 2.9529411764705884e-05, + "loss": 1.7577, + "step": 211500 + }, + { + "epoch": 82.84, + "eval_bleu_bleu": 0.10238714972649084, + "eval_bleu_brevity_penalty": 0.9638403367877845, + "eval_bleu_length_ratio": 0.9644786154046308, + "eval_bleu_precisions": [ + 0.3936340099645367, + 0.15560154265826356, + 0.06849994883863707, + 0.030350417002959377 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229815, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.49753051017401, + "eval_chrf_word_order": 2, + "eval_loss": 2.039057493209839, + "eval_meteor": 0.30997651874001286, + "eval_runtime": 1051.4879, + "eval_samples_per_second": 16.356, + "eval_scarebleu_bp": 0.9873310176745013, + "eval_scarebleu_counts": [ + 104032, + 39796, + 16789, + 7212 + ], + "eval_scarebleu_precisions": [ + 42.02786721663145, + 17.277368713531537, + 7.876132349422742, + 3.6779405165027947 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.890385789627786, + "eval_scarebleu_sys_len": 247531, + "eval_scarebleu_totals": [ + 247531, + 230336, + 213163, + 196088 + ], + "eval_steps_per_second": 0.512, + "eval_ter_num_edits": 155562, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.238133617867, + "step": 211500 + }, + { + "epoch": 83.04, + "learning_rate": 2.948006316620608e-05, + "loss": 1.7575, + "step": 212000 + }, + { + "epoch": 83.04, + "eval_bleu_bleu": 0.10215443090375018, + "eval_bleu_brevity_penalty": 0.961293374825984, + "eval_bleu_length_ratio": 0.9620235102547854, + "eval_bleu_precisions": [ + 0.3940758190463726, + 0.15565354776334095, + 0.06859303960507815, + 0.030310016926373088 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229230, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.46770088442094, + "eval_chrf_word_order": 2, + "eval_loss": 2.043609380722046, + "eval_meteor": 0.30993826234299887, + "eval_runtime": 1045.8536, + "eval_samples_per_second": 16.444, + "eval_scarebleu_bp": 0.9861305537998551, + "eval_scarebleu_counts": [ + 103959, + 39715, + 16776, + 7191 + ], + "eval_scarebleu_precisions": [ + 42.04882823559866, + 17.264463851781656, + 7.881014347054015, + 3.6728502257543876 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.872918800280354, + "eval_scarebleu_sys_len": 247234, + "eval_scarebleu_totals": [ + 247234, + 230039, + 212866, + 195788 + ], + "eval_steps_per_second": 0.514, + "eval_ter_num_edits": 155651, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.27889031868077, + "step": 212000 + }, + { + "epoch": 83.24, + "learning_rate": 2.943071456770628e-05, + "loss": 1.7323, + "step": 212500 + }, + { + "epoch": 83.24, + "eval_bleu_bleu": 0.10213572683661733, + "eval_bleu_brevity_penalty": 0.9650485009078476, + "eval_bleu_length_ratio": 0.9656453149459248, + "eval_bleu_precisions": [ + 0.39350610405357833, + 0.15552518107262633, + 0.06838257457711112, + 0.02997895820741835 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230093, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.569026618517626, + "eval_chrf_word_order": 2, + "eval_loss": 2.044361114501953, + "eval_meteor": 0.3105513303419062, + "eval_runtime": 941.8898, + "eval_samples_per_second": 18.259, + "eval_scarebleu_bp": 0.9868421114465173, + "eval_scarebleu_counts": [ + 103970, + 39791, + 16772, + 7128 + ], + "eval_scarebleu_precisions": [ + 42.0233620306374, + 17.28427774037313, + 7.872626054956299, + 3.6373842267751892 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.8511469209831, + "eval_scarebleu_sys_len": 247410, + "eval_scarebleu_totals": [ + 247410, + 230215, + 213042, + 195965 + ], + "eval_steps_per_second": 0.571, + "eval_ter_num_edits": 155684, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.29400235381395, + "step": 212500 + }, + { + "epoch": 83.43, + "learning_rate": 2.9381365969206476e-05, + "loss": 1.7478, + "step": 213000 + }, + { + "epoch": 83.43, + "eval_bleu_bleu": 0.10230061006057854, + "eval_bleu_brevity_penalty": 0.9640273031360644, + "eval_bleu_length_ratio": 0.9646590761250466, + "eval_bleu_precisions": [ + 0.39375614509827805, + 0.15576757592999252, + 0.06837781710673037, + 0.03023680641943763 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229858, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.574137406252405, + "eval_chrf_word_order": 2, + "eval_loss": 2.041679620742798, + "eval_meteor": 0.30994413144026933, + "eval_runtime": 959.102, + "eval_samples_per_second": 17.931, + "eval_scarebleu_bp": 0.9884977815438599, + "eval_scarebleu_counts": [ + 104125, + 39904, + 16842, + 7213 + ], + "eval_scarebleu_precisions": [ + 42.01638285852635, + 17.302547425474256, + 7.8903354868330435, + 3.6730931793414605 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.909395834905013, + "eval_scarebleu_sys_len": 247820, + "eval_scarebleu_totals": [ + 247820, + 230625, + 213451, + 196374 + ], + "eval_steps_per_second": 0.561, + "eval_ter_num_edits": 155575, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.24408684382857, + "step": 213000 + }, + { + "epoch": 83.63, + "learning_rate": 2.9332116067903674e-05, + "loss": 1.7478, + "step": 213500 + }, + { + "epoch": 83.63, + "eval_bleu_bleu": 0.10244449205679151, + "eval_bleu_brevity_penalty": 0.9639446942533114, + "eval_bleu_length_ratio": 0.9645793376671885, + "eval_bleu_precisions": [ + 0.3933797136256249, + 0.15578149395233348, + 0.06871150580098627, + 0.030296237348546834 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229839, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.575378095515156, + "eval_chrf_word_order": 2, + "eval_loss": 2.0467095375061035, + "eval_meteor": 0.3100478715764116, + "eval_runtime": 935.8535, + "eval_samples_per_second": 18.377, + "eval_scarebleu_bp": 0.9859080895857133, + "eval_scarebleu_counts": [ + 103900, + 39804, + 16834, + 7202 + ], + "eval_scarebleu_precisions": [ + 42.034315212861934, + 17.30729094197857, + 7.910305388349286, + 3.6794457841173824 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.892923147814386, + "eval_scarebleu_sys_len": 247179, + "eval_scarebleu_totals": [ + 247179, + 229984, + 212811, + 195736 + ], + "eval_steps_per_second": 0.575, + "eval_ter_num_edits": 155739, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.31918907903594, + "step": 213500 + }, + { + "epoch": 83.82, + "learning_rate": 2.928276746940387e-05, + "loss": 1.7544, + "step": 214000 + }, + { + "epoch": 83.82, + "eval_bleu_bleu": 0.10198815556600191, + "eval_bleu_brevity_penalty": 0.9642403167408152, + "eval_bleu_length_ratio": 0.9648647174111021, + "eval_bleu_precisions": [ + 0.39375486609803095, + 0.1557128887885968, + 0.0681714744491207, + 0.029943642088043832 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229907, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.608039014501216, + "eval_chrf_word_order": 2, + "eval_loss": 2.040987491607666, + "eval_meteor": 0.3106529347748919, + "eval_runtime": 942.9195, + "eval_samples_per_second": 18.239, + "eval_scarebleu_bp": 0.9881951173618149, + "eval_scarebleu_counts": [ + 104163, + 39922, + 16814, + 7179 + ], + "eval_scarebleu_precisions": [ + 42.04444085652586, + 17.315983517675125, + 7.879949572821813, + 3.657250566749026 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.893267266828158, + "eval_scarebleu_sys_len": 247745, + "eval_scarebleu_totals": [ + 247745, + 230550, + 213377, + 196295 + ], + "eval_steps_per_second": 0.571, + "eval_ter_num_edits": 155515, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.21661041631367, + "step": 214000 + }, + { + "epoch": 84.02, + "learning_rate": 2.9233418870904067e-05, + "loss": 1.7533, + "step": 214500 + }, + { + "epoch": 84.02, + "eval_bleu_bleu": 0.10191391193563196, + "eval_bleu_brevity_penalty": 0.960787594014325, + "eval_bleu_length_ratio": 0.9615366859857561, + "eval_bleu_precisions": [ + 0.39440191345792924, + 0.15585671884068913, + 0.06843878043520676, + 0.03009244931605512 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229114, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.50407977523829, + "eval_chrf_word_order": 2, + "eval_loss": 2.0391087532043457, + "eval_meteor": 0.3099107918327601, + "eval_runtime": 940.7044, + "eval_samples_per_second": 18.282, + "eval_scarebleu_bp": 0.9829588701496721, + "eval_scarebleu_counts": [ + 103856, + 39723, + 16733, + 7126 + ], + "eval_scarebleu_precisions": [ + 42.14062836020142, + 17.326918379453538, + 7.8898355832386375, + 3.654190319421155 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.84010923638418, + "eval_scarebleu_sys_len": 246451, + "eval_scarebleu_totals": [ + 246451, + 229256, + 212083, + 195009 + ], + "eval_steps_per_second": 0.572, + "eval_ter_num_edits": 155530, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.2234795231924, + "step": 214500 + }, + { + "epoch": 84.21, + "learning_rate": 2.9184070272404263e-05, + "loss": 1.7294, + "step": 215000 + }, + { + "epoch": 84.21, + "eval_bleu_bleu": 0.10194631662284198, + "eval_bleu_brevity_penalty": 0.9650441575160555, + "eval_bleu_length_ratio": 0.9656411181849849, + "eval_bleu_precisions": [ + 0.3928254785042505, + 0.1554648491993781, + 0.06824974327796993, + 0.02987889505730659 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230092, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.59396059523569, + "eval_chrf_word_order": 2, + "eval_loss": 2.040893316268921, + "eval_meteor": 0.3103459894857326, + "eval_runtime": 932.5248, + "eval_samples_per_second": 18.442, + "eval_scarebleu_bp": 0.9873229384973843, + "eval_scarebleu_counts": [ + 103908, + 39826, + 16770, + 7145 + ], + "eval_scarebleu_precisions": [ + 41.97811165560399, + 17.29054329799335, + 7.867292797462951, + 3.643920848633211 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.858115435442194, + "eval_scarebleu_sys_len": 247529, + "eval_scarebleu_totals": [ + 247529, + 230334, + 213161, + 196080 + ], + "eval_steps_per_second": 0.577, + "eval_ter_num_edits": 155740, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.31964701949452, + "step": 215000 + }, + { + "epoch": 84.41, + "learning_rate": 2.913482037110146e-05, + "loss": 1.7349, + "step": 215500 + }, + { + "epoch": 84.41, + "eval_bleu_bleu": 0.1021620878120159, + "eval_bleu_brevity_penalty": 0.9637620617997801, + "eval_bleu_length_ratio": 0.9644030737077124, + "eval_bleu_precisions": [ + 0.39400862500380773, + 0.15600041391896596, + 0.06839369224629302, + 0.03003531588093503 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229797, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.646782978525124, + "eval_chrf_word_order": 2, + "eval_loss": 2.0416171550750732, + "eval_meteor": 0.3110908612346454, + "eval_runtime": 935.2899, + "eval_samples_per_second": 18.388, + "eval_scarebleu_bp": 0.9868097787516408, + "eval_scarebleu_counts": [ + 104105, + 39893, + 16809, + 7179 + ], + "eval_scarebleu_precisions": [ + 42.07928796048537, + 17.329186340988763, + 7.890252775365551, + 3.663652323017882 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.890397551546375, + "eval_scarebleu_sys_len": 247402, + "eval_scarebleu_totals": [ + 247402, + 230207, + 213035, + 195952 + ], + "eval_steps_per_second": 0.575, + "eval_ter_num_edits": 155549, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.23218039190544, + "step": 215500 + }, + { + "epoch": 84.61, + "learning_rate": 2.9085471772601657e-05, + "loss": 1.7319, + "step": 216000 + }, + { + "epoch": 84.61, + "eval_bleu_bleu": 0.10263915177360378, + "eval_bleu_brevity_penalty": 0.9679718093786221, + "eval_bleu_length_ratio": 0.9684739318194218, + "eval_bleu_precisions": [ + 0.3939948086164833, + 0.1559427265746446, + 0.06836649491884406, + 0.030095560932639022 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230767, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.59620826115884, + "eval_chrf_word_order": 2, + "eval_loss": 2.040022134780884, + "eval_meteor": 0.31141805703914227, + "eval_runtime": 923.6607, + "eval_samples_per_second": 18.619, + "eval_scarebleu_bp": 0.9920824929615539, + "eval_scarebleu_counts": [ + 104552, + 40106, + 16880, + 7210 + ], + "eval_scarebleu_precisions": [ + 42.03771460737405, + 17.32328358853638, + 7.875264763788712, + 3.655037462866644 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.937252024618772, + "eval_scarebleu_sys_len": 248710, + "eval_scarebleu_totals": [ + 248710, + 231515, + 214342, + 197262 + ], + "eval_steps_per_second": 0.582, + "eval_ter_num_edits": 155485, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.20287220255622, + "step": 216000 + }, + { + "epoch": 84.8, + "learning_rate": 2.903612317410186e-05, + "loss": 1.751, + "step": 216500 + }, + { + "epoch": 84.8, + "eval_bleu_bleu": 0.10226184534344322, + "eval_bleu_brevity_penalty": 0.9631487033915289, + "eval_bleu_length_ratio": 0.9638113304151855, + "eval_bleu_precisions": [ + 0.39442470477583863, + 0.1562733866450784, + 0.06843794962647401, + 0.030125551179777173 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229656, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.6323546165923, + "eval_chrf_word_order": 2, + "eval_loss": 2.0405428409576416, + "eval_meteor": 0.31120723192979627, + "eval_runtime": 941.0852, + "eval_samples_per_second": 18.275, + "eval_scarebleu_bp": 0.9855358585282771, + "eval_scarebleu_counts": [ + 104047, + 39944, + 16819, + 7173 + ], + "eval_scarebleu_precisions": [ + 42.109459421175536, + 17.3751152715188, + 7.906712172923777, + 3.6663906523139205 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.89345236302341, + "eval_scarebleu_sys_len": 247087, + "eval_scarebleu_totals": [ + 247087, + 229892, + 212718, + 195642 + ], + "eval_steps_per_second": 0.572, + "eval_ter_num_edits": 155468, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.19508721476033, + "step": 216500 + }, + { + "epoch": 85.0, + "learning_rate": 2.8986774575602056e-05, + "loss": 1.7553, + "step": 217000 + }, + { + "epoch": 85.0, + "eval_bleu_bleu": 0.102471595457886, + "eval_bleu_brevity_penalty": 0.9649181912345675, + "eval_bleu_length_ratio": 0.9655194121177275, + "eval_bleu_precisions": [ + 0.3934878707136741, + 0.15609203825845125, + 0.06850001021930631, + 0.03023077482802434 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230063, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.591843974581714, + "eval_chrf_word_order": 2, + "eval_loss": 2.0359482765197754, + "eval_meteor": 0.3112024613915133, + "eval_runtime": 937.0411, + "eval_samples_per_second": 18.354, + "eval_scarebleu_bp": 0.9886591654247, + "eval_scarebleu_counts": [ + 104202, + 40038, + 16895, + 7218 + ], + "eval_scarebleu_precisions": [ + 42.04066811909949, + 17.357639867340083, + 7.913645476177093, + 3.6748907918987443 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.932787988994054, + "eval_scarebleu_sys_len": 247860, + "eval_scarebleu_totals": [ + 247860, + 230665, + 213492, + 196414 + ], + "eval_steps_per_second": 0.574, + "eval_ter_num_edits": 155562, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.238133617867, + "step": 217000 + }, + { + "epoch": 85.19, + "learning_rate": 2.8937524674299247e-05, + "loss": 1.7217, + "step": 217500 + }, + { + "epoch": 85.19, + "eval_bleu_bleu": 0.1023053309278255, + "eval_bleu_brevity_penalty": 0.9615636051525098, + "eval_bleu_length_ratio": 0.9622837094330595, + "eval_bleu_precisions": [ + 0.3944228320220505, + 0.15622568918938032, + 0.06858113133986878, + 0.030322279623810355 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229292, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.55800756679096, + "eval_chrf_word_order": 2, + "eval_loss": 2.0416204929351807, + "eval_meteor": 0.31060171919920465, + "eval_runtime": 954.2416, + "eval_samples_per_second": 18.023, + "eval_scarebleu_bp": 0.9863812731384145, + "eval_scarebleu_counts": [ + 104083, + 39921, + 16857, + 7209 + ], + "eval_scarebleu_precisions": [ + 42.088428442028984, + 17.34933789944416, + 7.916760595130748, + 3.680915812262571 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.913299809858495, + "eval_scarebleu_sys_len": 247296, + "eval_scarebleu_totals": [ + 247296, + 230101, + 212928, + 195848 + ], + "eval_steps_per_second": 0.564, + "eval_ter_num_edits": 155458, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.19050781017452, + "step": 217500 + }, + { + "epoch": 85.39, + "learning_rate": 2.888817607579945e-05, + "loss": 1.7319, + "step": 218000 + }, + { + "epoch": 85.39, + "eval_bleu_bleu": 0.10186663169514606, + "eval_bleu_brevity_penalty": 0.9595482648881156, + "eval_bleu_length_ratio": 0.9603448058788228, + "eval_bleu_precisions": [ + 0.3952759690600009, + 0.15627377324166608, + 0.06837347539027952, + 0.03007366243779272 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 228830, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.55806899469199, + "eval_chrf_word_order": 2, + "eval_loss": 2.0377559661865234, + "eval_meteor": 0.31045906632946463, + "eval_runtime": 945.3498, + "eval_samples_per_second": 18.192, + "eval_scarebleu_bp": 0.9848476808151465, + "eval_scarebleu_counts": [ + 104195, + 39923, + 16769, + 7161 + ], + "eval_scarebleu_precisions": [ + 42.19839055229085, + 17.37883180539957, + 7.889437779346037, + 3.6633653236202908 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.883100079920803, + "eval_scarebleu_sys_len": 246917, + "eval_scarebleu_totals": [ + 246917, + 229722, + 212550, + 195476 + ], + "eval_steps_per_second": 0.569, + "eval_ter_num_edits": 155419, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.17264813228984, + "step": 218000 + }, + { + "epoch": 85.59, + "learning_rate": 2.8838827477299647e-05, + "loss": 1.7364, + "step": 218500 + }, + { + "epoch": 85.59, + "eval_bleu_bleu": 0.1022128283729478, + "eval_bleu_brevity_penalty": 0.9613413240392183, + "eval_bleu_length_ratio": 0.9620696746251244, + "eval_bleu_precisions": [ + 0.39463272276774225, + 0.15622553596861058, + 0.0685313178270708, + 0.030246628954441683 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229241, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.61692050486167, + "eval_chrf_word_order": 2, + "eval_loss": 2.0398831367492676, + "eval_meteor": 0.31037539743040105, + "eval_runtime": 945.3215, + "eval_samples_per_second": 18.193, + "eval_scarebleu_bp": 0.9862478334658153, + "eval_scarebleu_counts": [ + 104140, + 39874, + 16819, + 7191 + ], + "eval_scarebleu_precisions": [ + 42.117097988781175, + 17.331397673731246, + 7.900064350366609, + 3.6722687788212585 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.897352825630774, + "eval_scarebleu_sys_len": 247263, + "eval_scarebleu_totals": [ + 247263, + 230068, + 212897, + 195819 + ], + "eval_steps_per_second": 0.569, + "eval_ter_num_edits": 155537, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.22668510640247, + "step": 218500 + }, + { + "epoch": 85.78, + "learning_rate": 2.8789478878799843e-05, + "loss": 1.7328, + "step": 219000 + }, + { + "epoch": 85.78, + "eval_bleu_bleu": 0.10227211295204938, + "eval_bleu_brevity_penalty": 0.9645358549875258, + "eval_bleu_length_ratio": 0.9651500971550158, + "eval_bleu_precisions": [ + 0.39369496684422217, + 0.15581821599774415, + 0.06835666927374873, + 0.03014369071218179 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229975, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.6687104167623, + "eval_chrf_word_order": 2, + "eval_loss": 2.0384998321533203, + "eval_meteor": 0.31108051952404975, + "eval_runtime": 940.8303, + "eval_samples_per_second": 18.28, + "eval_scarebleu_bp": 0.9860739311750575, + "eval_scarebleu_counts": [ + 103926, + 39769, + 16750, + 7144 + ], + "eval_scarebleu_precisions": [ + 42.03786101448103, + 17.288990327138354, + 7.869280677274927, + 3.6490310453677126 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.851960253173841, + "eval_scarebleu_sys_len": 247220, + "eval_scarebleu_totals": [ + 247220, + 230025, + 212853, + 195778 + ], + "eval_steps_per_second": 0.572, + "eval_ter_num_edits": 155573, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.2431709629114, + "step": 219000 + }, + { + "epoch": 85.98, + "learning_rate": 2.874022897749704e-05, + "loss": 1.7466, + "step": 219500 + }, + { + "epoch": 85.98, + "eval_bleu_bleu": 0.10240963522949105, + "eval_bleu_brevity_penalty": 0.9625262745667328, + "eval_bleu_length_ratio": 0.9632111936007789, + "eval_bleu_precisions": [ + 0.39449617233010764, + 0.15631270076018047, + 0.06874977582151806, + 0.03022766190382618 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229513, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.59426690909778, + "eval_chrf_word_order": 2, + "eval_loss": 2.0320260524749756, + "eval_meteor": 0.3106614799809918, + "eval_runtime": 925.7447, + "eval_samples_per_second": 18.577, + "eval_scarebleu_bp": 0.9890262178508452, + "eval_scarebleu_counts": [ + 104388, + 40030, + 16953, + 7245 + ], + "eval_scarebleu_precisions": [ + 42.10025367915435, + 17.347327913467037, + 7.937429477065122, + 3.6868540372196694 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.958345186401349, + "eval_scarebleu_sys_len": 247951, + "eval_scarebleu_totals": [ + 247951, + 230756, + 213583, + 196509 + ], + "eval_steps_per_second": 0.581, + "eval_ter_num_edits": 155485, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.20287220255622, + "step": 219500 + }, + { + "epoch": 86.17, + "learning_rate": 2.8690880378997237e-05, + "loss": 1.7187, + "step": 220000 + }, + { + "epoch": 86.17, + "eval_bleu_bleu": 0.10256468299242397, + "eval_bleu_brevity_penalty": 0.9613195292162727, + "eval_bleu_length_ratio": 0.9620486908204248, + "eval_bleu_precisions": [ + 0.3941832870927777, + 0.1562763805113162, + 0.06885192064941863, + 0.030550104307828993 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229236, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.64516307003317, + "eval_chrf_word_order": 2, + "eval_loss": 2.03739070892334, + "eval_meteor": 0.31022024244000057, + "eval_runtime": 923.8492, + "eval_samples_per_second": 18.616, + "eval_scarebleu_bp": 0.984086093742525, + "eval_scarebleu_counts": [ + 103944, + 39900, + 16874, + 7231 + ], + "eval_scarebleu_precisions": [ + 42.128813394453026, + 17.383045649010604, + 7.945903438013572, + 3.702736471262955 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.922734990026989, + "eval_scarebleu_sys_len": 246729, + "eval_scarebleu_totals": [ + 246729, + 229534, + 212361, + 195288 + ], + "eval_steps_per_second": 0.582, + "eval_ter_num_edits": 155619, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.26423622400615, + "step": 220000 + }, + { + "epoch": 86.37, + "learning_rate": 2.8641531780497433e-05, + "loss": 1.7324, + "step": 220500 + }, + { + "epoch": 86.37, + "eval_bleu_bleu": 0.10248398953279456, + "eval_bleu_brevity_penalty": 0.9629049994743359, + "eval_bleu_length_ratio": 0.9635763118025508, + "eval_bleu_precisions": [ + 0.39466463414634145, + 0.15620630399472704, + 0.06861123204179365, + 0.030336700336700335 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229600, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.66439250328028, + "eval_chrf_word_order": 2, + "eval_loss": 2.04058575630188, + "eval_meteor": 0.31123113571668, + "eval_runtime": 928.2891, + "eval_samples_per_second": 18.527, + "eval_scarebleu_bp": 0.9885179559370456, + "eval_scarebleu_counts": [ + 104316, + 40013, + 16874, + 7227 + ], + "eval_scarebleu_precisions": [ + 42.09260566932311, + 17.34943415860903, + 7.90503094271031, + 3.6801099908340973 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.93434084822096, + "eval_scarebleu_sys_len": 247825, + "eval_scarebleu_totals": [ + 247825, + 230630, + 213459, + 196380 + ], + "eval_steps_per_second": 0.58, + "eval_ter_num_edits": 155340, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.13647083606189, + "step": 220500 + }, + { + "epoch": 86.56, + "learning_rate": 2.8592183181997633e-05, + "loss": 1.7291, + "step": 221000 + }, + { + "epoch": 86.56, + "eval_bleu_bleu": 0.10274918846209147, + "eval_bleu_brevity_penalty": 0.9610230742862015, + "eval_bleu_length_ratio": 0.9617633110765111, + "eval_bleu_precisions": [ + 0.39509442854150667, + 0.15654352205233685, + 0.06904056710794454, + 0.030601166669479273 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229168, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.61514647281226, + "eval_chrf_word_order": 2, + "eval_loss": 2.0389320850372314, + "eval_meteor": 0.3109852442880468, + "eval_runtime": 930.2108, + "eval_samples_per_second": 18.488, + "eval_scarebleu_bp": 0.9858029076966518, + "eval_scarebleu_counts": [ + 104224, + 39984, + 16931, + 7258 + ], + "eval_scarebleu_precisions": [ + 42.16983002431692, + 17.387522938971465, + 7.956895255282352, + 3.708586261164592 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.956057443062829, + "eval_scarebleu_sys_len": 247153, + "eval_scarebleu_totals": [ + 247153, + 229958, + 212784, + 195708 + ], + "eval_steps_per_second": 0.578, + "eval_ter_num_edits": 155420, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.17310607274842, + "step": 221000 + }, + { + "epoch": 86.76, + "learning_rate": 2.8542933280694827e-05, + "loss": 1.7289, + "step": 221500 + }, + { + "epoch": 86.76, + "eval_bleu_bleu": 0.10265672180176695, + "eval_bleu_brevity_penalty": 0.9648921273335971, + "eval_bleu_length_ratio": 0.9654942315520881, + "eval_bleu_precisions": [ + 0.39400235593787625, + 0.15599778260093394, + 0.06861312376728358, + 0.030381560609198426 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230057, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.64707984943971, + "eval_chrf_word_order": 2, + "eval_loss": 2.0375070571899414, + "eval_meteor": 0.31058960164779814, + "eval_runtime": 1072.3436, + "eval_samples_per_second": 16.038, + "eval_scarebleu_bp": 0.9873956487714382, + "eval_scarebleu_counts": [ + 104190, + 39930, + 16909, + 7253 + ], + "eval_scarebleu_precisions": [ + 42.0889770427434, + 17.334340487601583, + 7.931683107940127, + 3.698491129842382 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.94284006576418, + "eval_scarebleu_sys_len": 247547, + "eval_scarebleu_totals": [ + 247547, + 230352, + 213183, + 196107 + ], + "eval_steps_per_second": 0.502, + "eval_ter_num_edits": 155626, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.26744180721623, + "step": 221500 + }, + { + "epoch": 86.96, + "learning_rate": 2.849358468219503e-05, + "loss": 1.7283, + "step": 222000 + }, + { + "epoch": 86.96, + "eval_bleu_bleu": 0.10275204424973329, + "eval_bleu_brevity_penalty": 0.9632270246478422, + "eval_bleu_length_ratio": 0.9638868721121039, + "eval_bleu_precisions": [ + 0.3945940768219302, + 0.15675431454402552, + 0.06884634879351215, + 0.030408589122240173 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229674, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.6778936450839, + "eval_chrf_word_order": 2, + "eval_loss": 2.0356576442718506, + "eval_meteor": 0.3115784864209917, + "eval_runtime": 1054.6506, + "eval_samples_per_second": 16.307, + "eval_scarebleu_bp": 0.9867572359221459, + "eval_scarebleu_counts": [ + 104199, + 40093, + 16915, + 7226 + ], + "eval_scarebleu_precisions": [ + 42.11949601639523, + 17.4170482288852, + 7.940494409028176, + 3.6878071684112217 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.946169898382292, + "eval_scarebleu_sys_len": 247389, + "eval_scarebleu_totals": [ + 247389, + 230194, + 213022, + 195943 + ], + "eval_steps_per_second": 0.51, + "eval_ter_num_edits": 155350, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.1410502406477, + "step": 222000 + }, + { + "epoch": 87.15, + "learning_rate": 2.8444236083695224e-05, + "loss": 1.7184, + "step": 222500 + }, + { + "epoch": 87.15, + "eval_bleu_bleu": 0.10310275697298836, + "eval_bleu_brevity_penalty": 0.9607265348755878, + "eval_bleu_length_ratio": 0.9614779313325975, + "eval_bleu_precisions": [ + 0.39597119161938016, + 0.1574526320756943, + 0.06920296180666098, + 0.030742824985931345 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229100, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.665463718487736, + "eval_chrf_word_order": 2, + "eval_loss": 2.0361177921295166, + "eval_meteor": 0.31167019609614594, + "eval_runtime": 1066.1436, + "eval_samples_per_second": 16.131, + "eval_scarebleu_bp": 0.9862923153080767, + "eval_scarebleu_counts": [ + 104421, + 40186, + 16979, + 7299 + ], + "eval_scarebleu_precisions": [ + 42.22886352790831, + 17.466174661746617, + 7.974880933369656, + 3.7271933452824118 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.001457178519571, + "eval_scarebleu_sys_len": 247274, + "eval_scarebleu_totals": [ + 247274, + 230079, + 212906, + 195831 + ], + "eval_steps_per_second": 0.505, + "eval_ter_num_edits": 155219, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.08106004057353, + "step": 222500 + }, + { + "epoch": 87.35, + "learning_rate": 2.839488748519542e-05, + "loss": 1.7112, + "step": 223000 + }, + { + "epoch": 87.35, + "eval_bleu_bleu": 0.10259816036966414, + "eval_bleu_brevity_penalty": 0.9629354655918478, + "eval_bleu_length_ratio": 0.9636056891291301, + "eval_bleu_precisions": [ + 0.39448710187407177, + 0.15641771651319133, + 0.06864497492970587, + 0.030425804134587328 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229607, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.728717633462566, + "eval_chrf_word_order": 2, + "eval_loss": 2.0393762588500977, + "eval_meteor": 0.31152114412537874, + "eval_runtime": 1045.9978, + "eval_samples_per_second": 16.442, + "eval_scarebleu_bp": 0.9857664960399977, + "eval_scarebleu_counts": [ + 104169, + 40021, + 16877, + 7246 + ], + "eval_scarebleu_precisions": [ + 42.14911144919561, + 17.404293995625117, + 7.931815618302816, + 3.702662789925242 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.942821875519478, + "eval_scarebleu_sys_len": 247144, + "eval_scarebleu_totals": [ + 247144, + 229949, + 212776, + 195697 + ], + "eval_steps_per_second": 0.514, + "eval_ter_num_edits": 155398, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.16303138265963, + "step": 223000 + }, + { + "epoch": 87.54, + "learning_rate": 2.834563758389262e-05, + "loss": 1.7241, + "step": 223500 + }, + { + "epoch": 87.54, + "eval_bleu_bleu": 0.10234633877654381, + "eval_bleu_brevity_penalty": 0.9632270246478422, + "eval_bleu_length_ratio": 0.9638868721121039, + "eval_bleu_precisions": [ + 0.39442427092313453, + 0.15651429082403437, + 0.06851867969833964, + 0.030133390174674937 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229674, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.68876509890531, + "eval_chrf_word_order": 2, + "eval_loss": 2.0320358276367188, + "eval_meteor": 0.3109215875207694, + "eval_runtime": 1067.1794, + "eval_samples_per_second": 16.115, + "eval_scarebleu_bp": 0.9881345736601082, + "eval_scarebleu_counts": [ + 104361, + 40092, + 16870, + 7192 + ], + "eval_scarebleu_precisions": [ + 42.12691236426755, + 17.390851714490207, + 7.906750030464656, + 3.6640785800167106 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.92688171940788, + "eval_scarebleu_sys_len": 247730, + "eval_scarebleu_totals": [ + 247730, + 230535, + 213362, + 196284 + ], + "eval_steps_per_second": 0.504, + "eval_ter_num_edits": 155349, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.14059230018913, + "step": 223500 + }, + { + "epoch": 87.74, + "learning_rate": 2.8296288985392817e-05, + "loss": 1.7228, + "step": 224000 + }, + { + "epoch": 87.74, + "eval_bleu_bleu": 0.10294836757924734, + "eval_bleu_brevity_penalty": 0.9637794567518695, + "eval_bleu_length_ratio": 0.964419860751472, + "eval_bleu_precisions": [ + 0.39512012567395266, + 0.15696170380892355, + 0.06906767086560994, + 0.03039271740714582 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229801, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.74409085748456, + "eval_chrf_word_order": 2, + "eval_loss": 2.0357441902160645, + "eval_meteor": 0.31207561208312606, + "eval_runtime": 1057.1826, + "eval_samples_per_second": 16.268, + "eval_scarebleu_bp": 0.9899896004693272, + "eval_scarebleu_counts": [ + 104649, + 40299, + 17027, + 7263 + ], + "eval_scarebleu_precisions": [ + 42.164873685482895, + 17.445832160869283, + 7.96320286594862, + 3.6916742909423603 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.00519020179112, + "eval_scarebleu_sys_len": 248190, + "eval_scarebleu_totals": [ + 248190, + 230995, + 213821, + 196740 + ], + "eval_steps_per_second": 0.509, + "eval_ter_num_edits": 155212, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.07785445736346, + "step": 224000 + }, + { + "epoch": 87.94, + "learning_rate": 2.824694038689301e-05, + "loss": 1.7375, + "step": 224500 + }, + { + "epoch": 87.94, + "eval_bleu_bleu": 0.10271956705202691, + "eval_bleu_brevity_penalty": 0.9608093999815734, + "eval_bleu_length_ratio": 0.9615576697904558, + "eval_bleu_precisions": [ + 0.39541024533102886, + 0.15690530567561956, + 0.06901721579560799, + 0.03050849365015952 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229119, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.704788232756115, + "eval_chrf_word_order": 2, + "eval_loss": 2.0340096950531006, + "eval_meteor": 0.31152449692874556, + "eval_runtime": 1071.0856, + "eval_samples_per_second": 16.057, + "eval_scarebleu_bp": 0.9842481813691458, + "eval_scarebleu_counts": [ + 104208, + 40079, + 16921, + 7249 + ], + "eval_scarebleu_precisions": [ + 42.228967171727405, + 17.457987402754668, + 7.96653499748118, + 3.711269480452991 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.959245178099605, + "eval_scarebleu_sys_len": 246769, + "eval_scarebleu_totals": [ + 246769, + 229574, + 212401, + 195324 + ], + "eval_steps_per_second": 0.502, + "eval_ter_num_edits": 155256, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.09800383754104, + "step": 224500 + }, + { + "epoch": 88.13, + "learning_rate": 2.8197591788393213e-05, + "loss": 1.7115, + "step": 225000 + }, + { + "epoch": 88.13, + "eval_bleu_bleu": 0.10225268040131115, + "eval_bleu_brevity_penalty": 0.9656346917061492, + "eval_bleu_length_ratio": 0.9662118776728121, + "eval_bleu_precisions": [ + 0.39390082874368015, + 0.15607910511516995, + 0.06818123803446076, + 0.029995135017251116 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230228, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.68634296250942, + "eval_chrf_word_order": 2, + "eval_loss": 2.0377910137176514, + "eval_meteor": 0.31107481707076506, + "eval_runtime": 1056.7291, + "eval_samples_per_second": 16.275, + "eval_scarebleu_bp": 0.9893689487007976, + "eval_scarebleu_counts": [ + 104343, + 40069, + 16861, + 7199 + ], + "eval_scarebleu_precisions": [ + 42.06768372333048, + 17.35783504663383, + 7.8911036125632394, + 3.6619546363224798 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.924275230332398, + "eval_scarebleu_sys_len": 248036, + "eval_scarebleu_totals": [ + 248036, + 230841, + 213671, + 196589 + ], + "eval_steps_per_second": 0.509, + "eval_ter_num_edits": 155528, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.22256364227523, + "step": 225000 + }, + { + "epoch": 88.33, + "learning_rate": 2.8148341887090408e-05, + "loss": 1.7045, + "step": 225500 + }, + { + "epoch": 88.33, + "eval_bleu_bleu": 0.10284770872512213, + "eval_bleu_brevity_penalty": 0.9625785206946118, + "eval_bleu_length_ratio": 0.9632615547320578, + "eval_bleu_precisions": [ + 0.39551247140834334, + 0.15679367023030188, + 0.0687759389250397, + 0.030556849888001256 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229525, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.677842735806955, + "eval_chrf_word_order": 2, + "eval_loss": 2.0366644859313965, + "eval_meteor": 0.3118340127856743, + "eval_runtime": 943.2241, + "eval_samples_per_second": 18.233, + "eval_scarebleu_bp": 0.9875491310978763, + "eval_scarebleu_counts": [ + 104525, + 40133, + 16926, + 7274 + ], + "eval_scarebleu_precisions": [ + 42.2178241815942, + 17.41959286427362, + 7.938391404062528, + 3.708594415185149 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.979195014629347, + "eval_scarebleu_sys_len": 247585, + "eval_scarebleu_totals": [ + 247585, + 230390, + 213217, + 196139 + ], + "eval_steps_per_second": 0.57, + "eval_ter_num_edits": 155293, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.11494763450857, + "step": 225500 + }, + { + "epoch": 88.52, + "learning_rate": 2.8098993288590604e-05, + "loss": 1.7169, + "step": 226000 + }, + { + "epoch": 88.52, + "eval_bleu_bleu": 0.10300038470548602, + "eval_bleu_brevity_penalty": 0.964470669967814, + "eval_bleu_length_ratio": 0.9650871457409171, + "eval_bleu_precisions": [ + 0.39526004522525654, + 0.15706060677273048, + 0.06888918427026032, + 0.0304157169338986 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229960, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.724068851994424, + "eval_chrf_word_order": 2, + "eval_loss": 2.0325467586517334, + "eval_meteor": 0.3125492603382309, + "eval_runtime": 1034.9394, + "eval_samples_per_second": 16.617, + "eval_scarebleu_bp": 0.9894173248732541, + "eval_scarebleu_counts": [ + 104588, + 40270, + 16974, + 7253 + ], + "eval_scarebleu_precisions": [ + 42.16441978971812, + 17.444001160911924, + 7.943691237791266, + 3.6892542141832574 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.988581606030756, + "eval_scarebleu_sys_len": 248048, + "eval_scarebleu_totals": [ + 248048, + 230853, + 213679, + 196598 + ], + "eval_steps_per_second": 0.52, + "eval_ter_num_edits": 155286, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.11174205129849, + "step": 226000 + }, + { + "epoch": 88.72, + "learning_rate": 2.8049644690090804e-05, + "loss": 1.7208, + "step": 226500 + }, + { + "epoch": 88.72, + "eval_bleu_bleu": 0.10287586267565511, + "eval_bleu_brevity_penalty": 0.9626481781115906, + "eval_bleu_length_ratio": 0.9633287029070963, + "eval_bleu_precisions": [ + 0.3949403374560536, + 0.15689487911239203, + 0.06880545935200935, + 0.03059288448800422 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229541, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.72498133105532, + "eval_chrf_word_order": 2, + "eval_loss": 2.035614013671875, + "eval_meteor": 0.3116207451396135, + "eval_runtime": 1096.6994, + "eval_samples_per_second": 15.682, + "eval_scarebleu_bp": 0.9872138632984448, + "eval_scarebleu_counts": [ + 104371, + 40179, + 16965, + 7294 + ], + "eval_scarebleu_precisions": [ + 42.16976024436166, + 17.445844025583245, + 7.959706478492605, + 3.720308682590445 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.99370967671915, + "eval_scarebleu_sys_len": 247502, + "eval_scarebleu_totals": [ + 247502, + 230307, + 213136, + 196059 + ], + "eval_steps_per_second": 0.491, + "eval_ter_num_edits": 155350, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.1410502406477, + "step": 226500 + }, + { + "epoch": 88.92, + "learning_rate": 2.8000296091591e-05, + "loss": 1.7245, + "step": 227000 + }, + { + "epoch": 88.92, + "eval_bleu_bleu": 0.10285961410805235, + "eval_bleu_brevity_penalty": 0.9622693595531006, + "eval_bleu_length_ratio": 0.9629635847053244, + "eval_bleu_precisions": [ + 0.39430997062592066, + 0.1566011335208401, + 0.06889870731632308, + 0.030686630199148593 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229454, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.67746991145489, + "eval_chrf_word_order": 2, + "eval_loss": 2.0311026573181152, + "eval_meteor": 0.31057118677615003, + "eval_runtime": 1112.8211, + "eval_samples_per_second": 15.454, + "eval_scarebleu_bp": 0.9845763296301503, + "eval_scarebleu_counts": [ + 104000, + 39946, + 16878, + 7271 + ], + "eval_scarebleu_precisions": [ + 42.13084869353859, + 17.393916962400123, + 7.94326107623234, + 3.720989739259487 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.944366424282398, + "eval_scarebleu_sys_len": 246850, + "eval_scarebleu_totals": [ + 246850, + 229655, + 212482, + 195405 + ], + "eval_steps_per_second": 0.483, + "eval_ter_num_edits": 155513, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.21569453539651, + "step": 227000 + }, + { + "epoch": 89.11, + "learning_rate": 2.7951046190288198e-05, + "loss": 1.7104, + "step": 227500 + }, + { + "epoch": 89.11, + "eval_bleu_bleu": 0.10301501717305268, + "eval_bleu_brevity_penalty": 0.9656303507714037, + "eval_bleu_length_ratio": 0.9662076809118723, + "eval_bleu_precisions": [ + 0.39440204667567225, + 0.15668538060009765, + 0.06877450579970593, + 0.030476382201792794 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230227, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.80452985273546, + "eval_chrf_word_order": 2, + "eval_loss": 2.034712314605713, + "eval_meteor": 0.31227619717839067, + "eval_runtime": 1120.518, + "eval_samples_per_second": 15.348, + "eval_scarebleu_bp": 0.9904810150694247, + "eval_scarebleu_counts": [ + 104565, + 40221, + 16943, + 7248 + ], + "eval_scarebleu_precisions": [ + 42.1103289410097, + 17.402873869079297, + 7.919362076057286, + 3.6817108170573745 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.975220684636167, + "eval_scarebleu_sys_len": 248312, + "eval_scarebleu_totals": [ + 248312, + 231117, + 213944, + 196865 + ], + "eval_steps_per_second": 0.48, + "eval_ter_num_edits": 155398, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.16303138265963, + "step": 227500 + }, + { + "epoch": 89.31, + "learning_rate": 2.7901697591788394e-05, + "loss": 1.7009, + "step": 228000 + }, + { + "epoch": 89.31, + "eval_bleu_bleu": 0.10261847209539177, + "eval_bleu_brevity_penalty": 0.9625959354867255, + "eval_bleu_length_ratio": 0.9632783417758174, + "eval_bleu_precisions": [ + 0.39474314792466314, + 0.156738911337798, + 0.06888724932624223, + 0.030303710773030932 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229529, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.656043635572985, + "eval_chrf_word_order": 2, + "eval_loss": 2.0333034992218018, + "eval_meteor": 0.3115009893551669, + "eval_runtime": 1115.5532, + "eval_samples_per_second": 15.417, + "eval_scarebleu_bp": 0.9855277650318643, + "eval_scarebleu_counts": [ + 104218, + 40020, + 16903, + 7207 + ], + "eval_scarebleu_precisions": [ + 42.179007224234574, + 17.408325720997, + 7.946238429462619, + 3.683825822049796 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.932937703896773, + "eval_scarebleu_sys_len": 247085, + "eval_scarebleu_totals": [ + 247085, + 229890, + 212717, + 195639 + ], + "eval_steps_per_second": 0.482, + "eval_ter_num_edits": 155402, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.16486314449395, + "step": 228000 + }, + { + "epoch": 89.5, + "learning_rate": 2.785234899328859e-05, + "loss": 1.7142, + "step": 228500 + }, + { + "epoch": 89.5, + "eval_bleu_bleu": 0.10364775245866724, + "eval_bleu_brevity_penalty": 0.9646749026667498, + "eval_bleu_length_ratio": 0.9652843935050928, + "eval_bleu_precisions": [ + 0.3955836126726578, + 0.1573548484108039, + 0.06937352735227523, + 0.03086053412462908 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230007, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.770433723004544, + "eval_chrf_word_order": 2, + "eval_loss": 2.0319104194641113, + "eval_meteor": 0.31289752037573637, + "eval_runtime": 1112.081, + "eval_samples_per_second": 15.465, + "eval_scarebleu_bp": 0.9904528256159585, + "eval_scarebleu_counts": [ + 104747, + 40363, + 17089, + 7326 + ], + "eval_scarebleu_precisions": [ + 42.18481303235939, + 17.464843580978755, + 7.987902924239025, + 3.7213696834854697 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.048913899203933, + "eval_scarebleu_sys_len": 248305, + "eval_scarebleu_totals": [ + 248305, + 231110, + 213936, + 196863 + ], + "eval_steps_per_second": 0.484, + "eval_ter_num_edits": 155122, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.03663981609111, + "step": 228500 + }, + { + "epoch": 89.7, + "learning_rate": 2.7803000394788793e-05, + "loss": 1.7141, + "step": 229000 + }, + { + "epoch": 89.7, + "eval_bleu_bleu": 0.10299406241083063, + "eval_bleu_brevity_penalty": 0.9629659308156368, + "eval_bleu_length_ratio": 0.9636350664557095, + "eval_bleu_precisions": [ + 0.3955333734005766, + 0.15725523611353034, + 0.06903651048095094, + 0.030474597955267264 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229614, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.77294170703882, + "eval_chrf_word_order": 2, + "eval_loss": 2.0325675010681152, + "eval_meteor": 0.3121184010930496, + "eval_runtime": 1120.6493, + "eval_samples_per_second": 15.346, + "eval_scarebleu_bp": 0.9878802505554072, + "eval_scarebleu_counts": [ + 104558, + 40246, + 17011, + 7286 + ], + "eval_scarebleu_precisions": [ + 42.21717063637868, + 17.46242493665174, + 7.975189757101534, + 3.7131601612467575 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.008089028049723, + "eval_scarebleu_sys_len": 247667, + "eval_scarebleu_totals": [ + 247667, + 230472, + 213299, + 196221 + ], + "eval_steps_per_second": 0.48, + "eval_ter_num_edits": 155206, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.07510681461197, + "step": 229000 + }, + { + "epoch": 89.89, + "learning_rate": 2.7753750493485984e-05, + "loss": 1.7165, + "step": 229500 + }, + { + "epoch": 89.89, + "eval_bleu_bleu": 0.10365013509955096, + "eval_bleu_brevity_penalty": 0.964787865174825, + "eval_bleu_length_ratio": 0.9653935092895304, + "eval_bleu_precisions": [ + 0.3946955436828629, + 0.15727924524755918, + 0.06931866963756414, + 0.03095767252044718 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230033, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.77855936140525, + "eval_chrf_word_order": 2, + "eval_loss": 2.0331504344940186, + "eval_meteor": 0.3121516968292642, + "eval_runtime": 1111.8474, + "eval_samples_per_second": 15.468, + "eval_scarebleu_bp": 0.9862882715848733, + "eval_scarebleu_counts": [ + 104307, + 40195, + 17048, + 7364 + ], + "eval_scarebleu_precisions": [ + 42.18293141588447, + 17.470162292787663, + 8.007327211667176, + 3.7604620404745006 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.03772697836946, + "eval_scarebleu_sys_len": 247273, + "eval_scarebleu_totals": [ + 247273, + 230078, + 212905, + 195827 + ], + "eval_steps_per_second": 0.484, + "eval_ter_num_edits": 155413, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.16990048953835, + "step": 229500 + }, + { + "epoch": 90.09, + "learning_rate": 2.770440189498618e-05, + "loss": 1.7026, + "step": 230000 + }, + { + "epoch": 90.09, + "eval_bleu_bleu": 0.10299685738570834, + "eval_bleu_brevity_penalty": 0.9622650045138852, + "eval_bleu_length_ratio": 0.9629593879443845, + "eval_bleu_precisions": [ + 0.3953576549445856, + 0.157242600985593, + 0.0690784584078689, + 0.03056427652751178 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229453, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.76649453160326, + "eval_chrf_word_order": 2, + "eval_loss": 2.032963514328003, + "eval_meteor": 0.3116247944331963, + "eval_runtime": 1084.8157, + "eval_samples_per_second": 15.853, + "eval_scarebleu_bp": 0.9867006482898009, + "eval_scarebleu_counts": [ + 104444, + 40226, + 17017, + 7285 + ], + "eval_scarebleu_precisions": [ + 42.22091965639212, + 17.47588843513772, + 7.988939330632326, + 3.7181836277427025 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.00555221591265, + "eval_scarebleu_sys_len": 247375, + "eval_scarebleu_totals": [ + 247375, + 230180, + 213007, + 195929 + ], + "eval_steps_per_second": 0.496, + "eval_ter_num_edits": 155197, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.07098535048473, + "step": 230000 + }, + { + "epoch": 90.29, + "learning_rate": 2.7655053296486384e-05, + "loss": 1.6926, + "step": 230500 + }, + { + "epoch": 90.29, + "eval_bleu_bleu": 0.10307681306308539, + "eval_bleu_brevity_penalty": 0.9640664313635212, + "eval_bleu_length_ratio": 0.9646968469735059, + "eval_bleu_precisions": [ + 0.39571578347479197, + 0.15703994884140837, + 0.06882441998445109, + 0.03055483957728643 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229867, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.758734350072466, + "eval_chrf_word_order": 2, + "eval_loss": 2.031848192214966, + "eval_meteor": 0.3126003032934088, + "eval_runtime": 1122.0514, + "eval_samples_per_second": 15.327, + "eval_scarebleu_bp": 0.9894415120912099, + "eval_scarebleu_counts": [ + 104762, + 40298, + 16981, + 7287 + ], + "eval_scarebleu_precisions": [ + 42.23354592145259, + 17.45567640854374, + 7.9467068502382, + 3.70635986328125 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.010812259473768, + "eval_scarebleu_sys_len": 248054, + "eval_scarebleu_totals": [ + 248054, + 230859, + 213686, + 196608 + ], + "eval_steps_per_second": 0.479, + "eval_ter_num_edits": 155152, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.05037802984856, + "step": 230500 + }, + { + "epoch": 90.48, + "learning_rate": 2.760570469798658e-05, + "loss": 1.703, + "step": 231000 + }, + { + "epoch": 90.48, + "eval_bleu_bleu": 0.10352787174571614, + "eval_bleu_brevity_penalty": 0.9665198620251509, + "eval_bleu_length_ratio": 0.967068016904553, + "eval_bleu_precisions": [ + 0.3953921330370782, + 0.15705529528177567, + 0.0690392039861891, + 0.030705037257158178 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230432, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.81653973605107, + "eval_chrf_word_order": 2, + "eval_loss": 2.0334129333496094, + "eval_meteor": 0.3129633868465815, + "eval_runtime": 1108.9438, + "eval_samples_per_second": 15.508, + "eval_scarebleu_bp": 0.9907266327099421, + "eval_scarebleu_counts": [ + 104834, + 40401, + 17097, + 7355 + ], + "eval_scarebleu_precisions": [ + 42.20829156148213, + 17.476143923729765, + 7.989065676035606, + 3.734943429952672 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.067288322302433, + "eval_scarebleu_sys_len": 248373, + "eval_scarebleu_totals": [ + 248373, + 231178, + 214005, + 196924 + ], + "eval_steps_per_second": 0.485, + "eval_ter_num_edits": 155095, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.0242754237094, + "step": 231000 + }, + { + "epoch": 90.68, + "learning_rate": 2.7556454796683778e-05, + "loss": 1.7042, + "step": 231500 + }, + { + "epoch": 90.68, + "eval_bleu_bleu": 0.10343269361535111, + "eval_bleu_brevity_penalty": 0.9663723861983586, + "eval_bleu_length_ratio": 0.9669253270325963, + "eval_bleu_precisions": [ + 0.3949556853792134, + 0.15705219907787413, + 0.068943706514864, + 0.030687836599700553 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230398, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.80511357910285, + "eval_chrf_word_order": 2, + "eval_loss": 2.0329627990722656, + "eval_meteor": 0.3125717961021219, + "eval_runtime": 1106.9912, + "eval_samples_per_second": 15.536, + "eval_scarebleu_bp": 0.9872340632955491, + "eval_scarebleu_counts": [ + 104420, + 40245, + 16982, + 7314 + ], + "eval_scarebleu_precisions": [ + 42.18870577397811, + 17.474122060509224, + 7.967458314175526, + 3.7304716389287007 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.011269440436365, + "eval_scarebleu_sys_len": 247507, + "eval_scarebleu_totals": [ + 247507, + 230312, + 213142, + 196061 + ], + "eval_steps_per_second": 0.486, + "eval_ter_num_edits": 155272, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.10533088487834, + "step": 231500 + }, + { + "epoch": 90.87, + "learning_rate": 2.7507106198183974e-05, + "loss": 1.7098, + "step": 232000 + }, + { + "epoch": 90.87, + "eval_bleu_bleu": 0.10332274825792401, + "eval_bleu_brevity_penalty": 0.9629354655918478, + "eval_bleu_length_ratio": 0.9636056891291301, + "eval_bleu_precisions": [ + 0.39605499832322183, + 0.1578818522494021, + 0.06926433532050888, + 0.030605373616753834 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229607, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.74621026639601, + "eval_chrf_word_order": 2, + "eval_loss": 2.030024528503418, + "eval_meteor": 0.3124596924789878, + "eval_runtime": 1097.2631, + "eval_samples_per_second": 15.674, + "eval_scarebleu_bp": 0.9861831291206417, + "eval_scarebleu_counts": [ + 104521, + 40299, + 17028, + 7274 + ], + "eval_scarebleu_precisions": [ + 42.273920411572234, + 17.517343904856293, + 7.998910179021886, + 3.7149394292251436 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.0112554483431, + "eval_scarebleu_sys_len": 247247, + "eval_scarebleu_totals": [ + 247247, + 230052, + 212879, + 195804 + ], + "eval_steps_per_second": 0.49, + "eval_ter_num_edits": 155094, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.02381748325082, + "step": 232000 + }, + { + "epoch": 91.07, + "learning_rate": 2.745775759968417e-05, + "loss": 1.7093, + "step": 232500 + }, + { + "epoch": 91.07, + "eval_bleu_bleu": 0.10292907636322492, + "eval_bleu_brevity_penalty": 0.9614502913047812, + "eval_bleu_length_ratio": 0.962174593648622, + "eval_bleu_precisions": [ + 0.39635183585878414, + 0.15732938497012794, + 0.06882150736237237, + 0.030607655287185714 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229266, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.72849279984333, + "eval_chrf_word_order": 2, + "eval_loss": 2.0297763347625732, + "eval_meteor": 0.3124403156329392, + "eval_runtime": 1088.1984, + "eval_samples_per_second": 15.804, + "eval_scarebleu_bp": 0.9879771430829702, + "eval_scarebleu_counts": [ + 104670, + 40247, + 16966, + 7289 + ], + "eval_scarebleu_precisions": [ + 42.2582976369751, + 17.461040538664445, + 7.953197733015193, + 3.7141969049208394 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.004500741949697, + "eval_scarebleu_sys_len": 247691, + "eval_scarebleu_totals": [ + 247691, + 230496, + 213323, + 196247 + ], + "eval_steps_per_second": 0.494, + "eval_ter_num_edits": 155057, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.00687368628331, + "step": 232500 + }, + { + "epoch": 91.27, + "learning_rate": 2.7408409001184367e-05, + "loss": 1.6939, + "step": 233000 + }, + { + "epoch": 91.27, + "eval_bleu_bleu": 0.10367264145151078, + "eval_bleu_brevity_penalty": 0.9654219645042712, + "eval_bleu_length_ratio": 0.9660062363867568, + "eval_bleu_precisions": [ + 0.39526194830979366, + 0.15737332381775157, + 0.06926152699121145, + 0.030865958506038384 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230179, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.83984636486258, + "eval_chrf_word_order": 2, + "eval_loss": 2.032769203186035, + "eval_meteor": 0.3127392734966889, + "eval_runtime": 1079.4936, + "eval_samples_per_second": 15.932, + "eval_scarebleu_bp": 0.9876904758204814, + "eval_scarebleu_counts": [ + 104516, + 40240, + 17028, + 7319 + ], + "eval_scarebleu_precisions": [ + 42.20822227606817, + 17.463382879461864, + 7.984956694224177, + 3.7309286285944405 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.023325419151664, + "eval_scarebleu_sys_len": 247620, + "eval_scarebleu_totals": [ + 247620, + 230425, + 213251, + 196171 + ], + "eval_steps_per_second": 0.498, + "eval_ter_num_edits": 155222, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.08243386194927, + "step": 233000 + }, + { + "epoch": 91.46, + "learning_rate": 2.7359159099881564e-05, + "loss": 1.6963, + "step": 233500 + }, + { + "epoch": 91.46, + "eval_bleu_bleu": 0.10380630803914208, + "eval_bleu_brevity_penalty": 0.9662205508905847, + "eval_bleu_length_ratio": 0.9667784403996995, + "eval_bleu_precisions": [ + 0.39506778432300327, + 0.15722810177887864, + 0.06928692777446163, + 0.030955427536920214 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230363, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.841361071343535, + "eval_chrf_word_order": 2, + "eval_loss": 2.032151222229004, + "eval_meteor": 0.31278375412972975, + "eval_runtime": 1088.8666, + "eval_samples_per_second": 15.794, + "eval_scarebleu_bp": 0.9886188218682643, + "eval_scarebleu_counts": [ + 104509, + 40266, + 17045, + 7355 + ], + "eval_scarebleu_precisions": [ + 42.16622957433932, + 17.45724133446056, + 7.9841675059137645, + 3.7446986166762555 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.04136159591552, + "eval_scarebleu_sys_len": 247850, + "eval_scarebleu_totals": [ + 247850, + 230655, + 213485, + 196411 + ], + "eval_steps_per_second": 0.494, + "eval_ter_num_edits": 155184, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.06503212452317, + "step": 233500 + }, + { + "epoch": 91.66, + "learning_rate": 2.730981050138176e-05, + "loss": 1.701, + "step": 234000 + }, + { + "epoch": 91.66, + "eval_bleu_bleu": 0.10345196301236911, + "eval_bleu_brevity_penalty": 0.9654480150805774, + "eval_bleu_length_ratio": 0.9660314169523961, + "eval_bleu_precisions": [ + 0.3950170515020527, + 0.1570965773040988, + 0.06910656290213861, + 0.03074238152772184 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230185, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.74996558265536, + "eval_chrf_word_order": 2, + "eval_loss": 2.0321128368377686, + "eval_meteor": 0.3120641596910749, + "eval_runtime": 1073.6696, + "eval_samples_per_second": 16.018, + "eval_scarebleu_bp": 0.9887842202242363, + "eval_scarebleu_counts": [ + 104510, + 40169, + 16973, + 7300 + ], + "eval_scarebleu_precisions": [ + 42.15965888233135, + 17.412092103894302, + 7.949026568566384, + 3.7161285067781167 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.998852264023165, + "eval_scarebleu_sys_len": 247891, + "eval_scarebleu_totals": [ + 247891, + 230696, + 213523, + 196441 + ], + "eval_steps_per_second": 0.501, + "eval_ter_num_edits": 155274, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.1062467657955, + "step": 234000 + }, + { + "epoch": 91.85, + "learning_rate": 2.726046190288196e-05, + "loss": 1.7062, + "step": 234500 + }, + { + "epoch": 91.85, + "eval_bleu_bleu": 0.10340088389551776, + "eval_bleu_brevity_penalty": 0.9652309069248042, + "eval_bleu_length_ratio": 0.9658215789054008, + "eval_bleu_precisions": [ + 0.39567210550329157, + 0.1573917535455997, + 0.06909867298675029, + 0.0306044804511783 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230135, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.866985610564136, + "eval_chrf_word_order": 2, + "eval_loss": 2.0299034118652344, + "eval_meteor": 0.3131692776195573, + "eval_runtime": 1086.7267, + "eval_samples_per_second": 15.826, + "eval_scarebleu_bp": 0.9877712353750262, + "eval_scarebleu_counts": [ + 104600, + 40288, + 17032, + 7291 + ], + "eval_scarebleu_precisions": [ + 42.2387336456146, + 17.482696521946668, + 7.9860834337533, + 3.716276485669577 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.018400357955048, + "eval_scarebleu_sys_len": 247640, + "eval_scarebleu_totals": [ + 247640, + 230445, + 213271, + 196191 + ], + "eval_steps_per_second": 0.495, + "eval_ter_num_edits": 155095, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.0242754237094, + "step": 234500 + }, + { + "epoch": 92.05, + "learning_rate": 2.7211113304382157e-05, + "loss": 1.694, + "step": 235000 + }, + { + "epoch": 92.05, + "eval_bleu_bleu": 0.10364827418886252, + "eval_bleu_brevity_penalty": 0.9681363791528796, + "eval_bleu_length_ratio": 0.9686334087351383, + "eval_bleu_precisions": [ + 0.395580684993826, + 0.157263236739853, + 0.06891900146603681, + 0.030640854844733306 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230805, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.861275896026186, + "eval_chrf_word_order": 2, + "eval_loss": 2.0303568840026855, + "eval_meteor": 0.3136447699771708, + "eval_runtime": 1080.7868, + "eval_samples_per_second": 15.912, + "eval_scarebleu_bp": 0.9907789697283386, + "eval_scarebleu_counts": [ + 104883, + 40375, + 17063, + 7332 + ], + "eval_scarebleu_precisions": [ + 42.22580982825119, + 17.46391511780303, + 7.972693885561028, + 3.7229991164732046 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.051224729005419, + "eval_scarebleu_sys_len": 248386, + "eval_scarebleu_totals": [ + 248386, + 231191, + 214018, + 196938 + ], + "eval_steps_per_second": 0.498, + "eval_ter_num_edits": 155052, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.0045839839904, + "step": 235000 + }, + { + "epoch": 92.24, + "learning_rate": 2.716186340307935e-05, + "loss": 1.6952, + "step": 235500 + }, + { + "epoch": 92.24, + "eval_bleu_bleu": 0.10332129564310935, + "eval_bleu_brevity_penalty": 0.9660469975453495, + "eval_bleu_length_ratio": 0.9666105699621033, + "eval_bleu_precisions": [ + 0.39585712238899284, + 0.15740306294808754, + 0.06904188438928804, + 0.030415998300907115 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230323, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.85848425402393, + "eval_chrf_word_order": 2, + "eval_loss": 2.028691053390503, + "eval_meteor": 0.3133388512389026, + "eval_runtime": 1097.2612, + "eval_samples_per_second": 15.674, + "eval_scarebleu_bp": 0.988630925104152, + "eval_scarebleu_counts": [ + 104758, + 40327, + 17037, + 7296 + ], + "eval_scarebleu_precisions": [ + 42.266181970764926, + 17.483460361227444, + 7.980420170035366, + 3.714754131747503 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.02757994699251, + "eval_scarebleu_sys_len": 247853, + "eval_scarebleu_totals": [ + 247853, + 230658, + 213485, + 196406 + ], + "eval_steps_per_second": 0.49, + "eval_ter_num_edits": 155103, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.02793894737806, + "step": 235500 + }, + { + "epoch": 92.44, + "learning_rate": 2.7112514804579554e-05, + "loss": 1.6817, + "step": 236000 + }, + { + "epoch": 92.44, + "eval_bleu_bleu": 0.10336611233957835, + "eval_bleu_brevity_penalty": 0.9650789041406536, + "eval_bleu_length_ratio": 0.9656746922725041, + "eval_bleu_precisions": [ + 0.3944545849630595, + 0.15716869026091448, + 0.06925847403509668, + 0.030649647168111385 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230100, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.86826950507065, + "eval_chrf_word_order": 2, + "eval_loss": 2.0296735763549805, + "eval_meteor": 0.31218965168987667, + "eval_runtime": 1100.027, + "eval_samples_per_second": 15.634, + "eval_scarebleu_bp": 0.9892681575711707, + "eval_scarebleu_counts": [ + 104492, + 40296, + 17098, + 7334 + ], + "eval_scarebleu_precisions": [ + 42.13200220957941, + 17.458061832801885, + 8.003070542915049, + 3.731100303209133 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.043132208586655, + "eval_scarebleu_sys_len": 248011, + "eval_scarebleu_totals": [ + 248011, + 230816, + 213643, + 196564 + ], + "eval_steps_per_second": 0.489, + "eval_ter_num_edits": 155414, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.17035842999692, + "step": 236000 + }, + { + "epoch": 92.64, + "learning_rate": 2.7063166206079747e-05, + "loss": 1.6935, + "step": 236500 + }, + { + "epoch": 92.64, + "eval_bleu_bleu": 0.10357336975627085, + "eval_bleu_brevity_penalty": 0.9659037941272649, + "eval_bleu_length_ratio": 0.9664720768510864, + "eval_bleu_precisions": [ + 0.39547092796039773, + 0.15765738285741102, + 0.06933457184562149, + 0.03058286889782046 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230290, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.85739139638304, + "eval_chrf_word_order": 2, + "eval_loss": 2.0286266803741455, + "eval_meteor": 0.31317331048556446, + "eval_runtime": 955.6457, + "eval_samples_per_second": 17.996, + "eval_scarebleu_bp": 0.9924603604625479, + "eval_scarebleu_counts": [ + 104909, + 40526, + 17179, + 7353 + ], + "eval_scarebleu_precisions": [ + 42.165318885548466, + 17.49759292600892, + 8.01124811132459, + 3.7256789623023914 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.089908030346873, + "eval_scarebleu_sys_len": 248804, + "eval_scarebleu_totals": [ + 248804, + 231609, + 214436, + 197360 + ], + "eval_steps_per_second": 0.563, + "eval_ter_num_edits": 155079, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.0169483763721, + "step": 236500 + }, + { + "epoch": 92.83, + "learning_rate": 2.7013817607579944e-05, + "loss": 1.7028, + "step": 237000 + }, + { + "epoch": 92.83, + "eval_bleu_bleu": 0.10345675072440158, + "eval_bleu_brevity_penalty": 0.9634010507326192, + "eval_bleu_length_ratio": 0.9640547425497001, + "eval_bleu_precisions": [ + 0.3958052186632073, + 0.1578729431250853, + 0.06933901176807826, + 0.030693047096694594 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229714, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.89573379005967, + "eval_chrf_word_order": 2, + "eval_loss": 2.0299320220947266, + "eval_meteor": 0.3131779311909076, + "eval_runtime": 937.2276, + "eval_samples_per_second": 18.35, + "eval_scarebleu_bp": 0.9860658419705685, + "eval_scarebleu_counts": [ + 104504, + 40316, + 17048, + 7314 + ], + "eval_scarebleu_precisions": [ + 42.27200284768909, + 17.526942957878124, + 8.009396288466055, + 3.7359404210977964 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.03221532626436, + "eval_scarebleu_sys_len": 247218, + "eval_scarebleu_totals": [ + 247218, + 230023, + 212850, + 195774 + ], + "eval_steps_per_second": 0.574, + "eval_ter_num_edits": 155184, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.06503212452317, + "step": 237000 + }, + { + "epoch": 93.03, + "learning_rate": 2.6964567706277145e-05, + "loss": 1.6948, + "step": 237500 + }, + { + "epoch": 93.03, + "eval_bleu_bleu": 0.1037765775719339, + "eval_bleu_brevity_penalty": 0.9640012168311239, + "eval_bleu_length_ratio": 0.9646338955594073, + "eval_bleu_precisions": [ + 0.396964133442389, + 0.15807144838871987, + 0.06960720624868924, + 0.03074879795568407 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229852, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.841462796801636, + "eval_chrf_word_order": 2, + "eval_loss": 2.0258073806762695, + "eval_meteor": 0.3138342215559259, + "eval_runtime": 941.5434, + "eval_samples_per_second": 18.266, + "eval_scarebleu_bp": 0.9899331933334048, + "eval_scarebleu_counts": [ + 105117, + 40554, + 17193, + 7371 + ], + "eval_scarebleu_precisions": [ + 42.35582812197795, + 17.557288261805084, + 8.0412891880136, + 3.7468357004158066 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.111449526122628, + "eval_scarebleu_sys_len": 248176, + "eval_scarebleu_totals": [ + 248176, + 230981, + 213809, + 196726 + ], + "eval_steps_per_second": 0.571, + "eval_ter_num_edits": 154888, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.92948174878302, + "step": 237500 + }, + { + "epoch": 93.22, + "learning_rate": 2.691521910777734e-05, + "loss": 1.6753, + "step": 238000 + }, + { + "epoch": 93.22, + "eval_bleu_bleu": 0.10388886342809993, + "eval_bleu_brevity_penalty": 0.9663420209188885, + "eval_bleu_length_ratio": 0.9668959497060169, + "eval_bleu_precisions": [ + 0.3952107504199383, + 0.15765305165200097, + 0.06946754134486875, + 0.030863093907835336 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230391, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.914268692738204, + "eval_chrf_word_order": 2, + "eval_loss": 2.031459331512451, + "eval_meteor": 0.31369800634000394, + "eval_runtime": 944.3155, + "eval_samples_per_second": 18.212, + "eval_scarebleu_bp": 0.9885704074764696, + "eval_scarebleu_counts": [ + 104609, + 40377, + 17114, + 7346 + ], + "eval_scarebleu_precisions": [ + 42.20862014703153, + 17.506275932935317, + 8.01705157633391, + 3.7405734595467113 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.061312040959018, + "eval_scarebleu_sys_len": 247838, + "eval_scarebleu_totals": [ + 247838, + 230643, + 213470, + 196387 + ], + "eval_steps_per_second": 0.57, + "eval_ter_num_edits": 155135, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.04259304205267, + "step": 238000 + }, + { + "epoch": 93.42, + "learning_rate": 2.6865870509277534e-05, + "loss": 1.6766, + "step": 238500 + }, + { + "epoch": 93.42, + "eval_bleu_bleu": 0.10371390477297744, + "eval_bleu_brevity_penalty": 0.9672612600699373, + "eval_bleu_length_ratio": 0.9677856630252771, + "eval_bleu_precisions": [ + 0.3946305989080801, + 0.15720591542959964, + 0.06925420896009131, + 0.0307657107141462 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230603, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.888815758346894, + "eval_chrf_word_order": 2, + "eval_loss": 2.0295872688293457, + "eval_meteor": 0.3132891377129046, + "eval_runtime": 944.3856, + "eval_samples_per_second": 18.211, + "eval_scarebleu_bp": 0.9910003655490124, + "eval_scarebleu_counts": [ + 104662, + 40384, + 17103, + 7361 + ], + "eval_scarebleu_precisions": [ + 42.127507134490685, + 17.463653425356547, + 7.989330742316874, + 3.7367758442138608 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.064265680728566, + "eval_scarebleu_sys_len": 248441, + "eval_scarebleu_totals": [ + 248441, + 231246, + 214073, + 196988 + ], + "eval_steps_per_second": 0.57, + "eval_ter_num_edits": 155293, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.11494763450857, + "step": 238500 + }, + { + "epoch": 93.62, + "learning_rate": 2.6816521910777737e-05, + "loss": 1.69, + "step": 239000 + }, + { + "epoch": 93.62, + "eval_bleu_bleu": 0.10303020383536997, + "eval_bleu_brevity_penalty": 0.9664417892056989, + "eval_bleu_length_ratio": 0.9669924752076348, + "eval_bleu_precisions": [ + 0.3950063798206706, + 0.15687626337240115, + 0.06876536535106959, + 0.030312679817431187 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230414, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.88135445808661, + "eval_chrf_word_order": 2, + "eval_loss": 2.0279436111450195, + "eval_meteor": 0.3123722588882045, + "eval_runtime": 940.6824, + "eval_samples_per_second": 18.282, + "eval_scarebleu_bp": 0.9892076780690625, + "eval_scarebleu_counts": [ + 104583, + 40229, + 16963, + 7263 + ], + "eval_scarebleu_precisions": [ + 42.17124469749512, + 17.430167113660687, + 7.940438519295223, + 3.695468560787227 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.987965131898331, + "eval_scarebleu_sys_len": 247996, + "eval_scarebleu_totals": [ + 247996, + 230801, + 213628, + 196538 + ], + "eval_steps_per_second": 0.572, + "eval_ter_num_edits": 155293, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.11494763450857, + "step": 239000 + }, + { + "epoch": 93.81, + "learning_rate": 2.6767173312277933e-05, + "loss": 1.6976, + "step": 239500 + }, + { + "epoch": 93.81, + "eval_bleu_bleu": 0.10369293319198665, + "eval_bleu_brevity_penalty": 0.9620472292828396, + "eval_bleu_length_ratio": 0.9627495498973891, + "eval_bleu_precisions": [ + 0.39708286290937783, + 0.15838234185327604, + 0.06969089501504766, + 0.03079265380877206 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229403, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.85770520172085, + "eval_chrf_word_order": 2, + "eval_loss": 2.025296688079834, + "eval_meteor": 0.3132205135599489, + "eval_runtime": 921.0639, + "eval_samples_per_second": 18.672, + "eval_scarebleu_bp": 0.9869108149978911, + "eval_scarebleu_counts": [ + 104826, + 40475, + 17113, + 7315 + ], + "eval_scarebleu_precisions": [ + 42.36643535264947, + 17.580093123458077, + 8.032009762508213, + 3.732580864080989 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.06415880618449, + "eval_scarebleu_sys_len": 247427, + "eval_scarebleu_totals": [ + 247427, + 230232, + 213060, + 195977 + ], + "eval_steps_per_second": 0.584, + "eval_ter_num_edits": 154936, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.95146289079494, + "step": 239500 + }, + { + "epoch": 94.01, + "learning_rate": 2.671792341097513e-05, + "loss": 1.7002, + "step": 240000 + }, + { + "epoch": 94.01, + "eval_bleu_bleu": 0.10360290684378064, + "eval_bleu_brevity_penalty": 0.9644619783222124, + "eval_bleu_length_ratio": 0.9650787522190374, + "eval_bleu_precisions": [ + 0.39578966593899756, + 0.15774829270126856, + 0.0694519000219833, + 0.03070676523297491 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229958, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.91676614854053, + "eval_chrf_word_order": 2, + "eval_loss": 2.0266661643981934, + "eval_meteor": 0.3130376610167476, + "eval_runtime": 939.9764, + "eval_samples_per_second": 18.296, + "eval_scarebleu_bp": 0.9862195258228535, + "eval_scarebleu_counts": [ + 104523, + 40320, + 17077, + 7313 + ], + "eval_scarebleu_precisions": [ + 42.273190539360016, + 17.52578663919569, + 8.021588816654766, + 3.734742862979419 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.037588946948045, + "eval_scarebleu_sys_len": 247256, + "eval_scarebleu_totals": [ + 247256, + 230061, + 212888, + 195810 + ], + "eval_steps_per_second": 0.572, + "eval_ter_num_edits": 155178, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.06228448177167, + "step": 240000 + }, + { + "epoch": 94.2, + "learning_rate": 2.6668574812475327e-05, + "loss": 1.6766, + "step": 240500 + }, + { + "epoch": 94.2, + "eval_bleu_bleu": 0.10314572258519114, + "eval_bleu_brevity_penalty": 0.961302093029142, + "eval_bleu_length_ratio": 0.9620319037766651, + "eval_bleu_precisions": [ + 0.3970344454526419, + 0.15801015860439452, + 0.06943831525364587, + 0.03042656800008997 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229232, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.888351989885926, + "eval_chrf_word_order": 2, + "eval_loss": 2.0267841815948486, + "eval_meteor": 0.3128875321980566, + "eval_runtime": 936.4119, + "eval_samples_per_second": 18.366, + "eval_scarebleu_bp": 0.9836726532439343, + "eval_scarebleu_counts": [ + 104553, + 40253, + 17005, + 7232 + ], + "eval_scarebleu_precisions": [ + 42.39316863117177, + 17.544631960668085, + 8.011401111843965, + 3.7051837734263726 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 11.990579988211005, + "eval_scarebleu_sys_len": 246627, + "eval_scarebleu_totals": [ + 246627, + 229432, + 212260, + 195186 + ], + "eval_steps_per_second": 0.575, + "eval_ter_num_edits": 154987, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.9748178541826, + "step": 240500 + }, + { + "epoch": 94.4, + "learning_rate": 2.6619226213975524e-05, + "loss": 1.6776, + "step": 241000 + }, + { + "epoch": 94.4, + "eval_bleu_bleu": 0.10329310635033061, + "eval_bleu_brevity_penalty": 0.9635924457338001, + "eval_bleu_length_ratio": 0.964239400031056, + "eval_bleu_precisions": [ + 0.39621253666901696, + 0.15774617407545058, + 0.06933910604804454, + 0.030468180543874405 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229758, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.90344557070067, + "eval_chrf_word_order": 2, + "eval_loss": 2.0283780097961426, + "eval_meteor": 0.31275818852272347, + "eval_runtime": 936.9384, + "eval_samples_per_second": 18.356, + "eval_scarebleu_bp": 0.9865793784374555, + "eval_scarebleu_counts": [ + 104641, + 40292, + 17032, + 7259 + ], + "eval_scarebleu_precisions": [ + 42.30568638945602, + 17.506843363024114, + 7.997107668903215, + 3.705594380605739 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.008296069123922, + "eval_scarebleu_sys_len": 247345, + "eval_scarebleu_totals": [ + 247345, + 230150, + 212977, + 195893 + ], + "eval_steps_per_second": 0.574, + "eval_ter_num_edits": 155185, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.06549006498174, + "step": 241000 + }, + { + "epoch": 94.59, + "learning_rate": 2.6569877615475723e-05, + "loss": 1.6804, + "step": 241500 + }, + { + "epoch": 94.59, + "eval_bleu_bleu": 0.10363600038112908, + "eval_bleu_brevity_penalty": 0.9649268790558998, + "eval_bleu_length_ratio": 0.9655278056396074, + "eval_bleu_precisions": [ + 0.39610979505791843, + 0.15787569878329497, + 0.06942485744067693, + 0.030649196550006436 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230065, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.89479613623014, + "eval_chrf_word_order": 2, + "eval_loss": 2.0260417461395264, + "eval_meteor": 0.31328215315335334, + "eval_runtime": 932.0205, + "eval_samples_per_second": 18.452, + "eval_scarebleu_bp": 0.9877106663130661, + "eval_scarebleu_counts": [ + 104700, + 40396, + 17101, + 7333 + ], + "eval_scarebleu_precisions": [ + 42.281675921251896, + 17.530703467430456, + 8.018963035211037, + 3.73781755902622 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.058733736587133, + "eval_scarebleu_sys_len": 247625, + "eval_scarebleu_totals": [ + 247625, + 230430, + 213257, + 196184 + ], + "eval_steps_per_second": 0.577, + "eval_ter_num_edits": 155084, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.01923807866501, + "step": 241500 + }, + { + "epoch": 94.79, + "learning_rate": 2.6520627714172918e-05, + "loss": 1.6881, + "step": 242000 + }, + { + "epoch": 94.79, + "eval_bleu_bleu": 0.10392186612102852, + "eval_bleu_brevity_penalty": 0.9616812641591826, + "eval_bleu_length_ratio": 0.962397021978437, + "eval_bleu_precisions": [ + 0.39646082531321, + 0.15835549018498615, + 0.07003344207135677, + 0.031014461799603186 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229319, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.930447028464954, + "eval_chrf_word_order": 2, + "eval_loss": 2.0241012573242188, + "eval_meteor": 0.3131498334871809, + "eval_runtime": 950.9693, + "eval_samples_per_second": 18.085, + "eval_scarebleu_bp": 0.9872179033300917, + "eval_scarebleu_counts": [ + 104726, + 40540, + 17268, + 7444 + ], + "eval_scarebleu_precisions": [ + 42.31302246841452, + 17.602514893099674, + 8.10186922903686, + 3.7968356302726742 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.145823656319136, + "eval_scarebleu_sys_len": 247503, + "eval_scarebleu_totals": [ + 247503, + 230308, + 213136, + 196058 + ], + "eval_steps_per_second": 0.566, + "eval_ter_num_edits": 154912, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.94047231978898, + "step": 242000 + }, + { + "epoch": 94.99, + "learning_rate": 2.6471279115673114e-05, + "loss": 1.6847, + "step": 242500 + }, + { + "epoch": 94.99, + "eval_bleu_bleu": 0.10451619080041506, + "eval_bleu_brevity_penalty": 0.9650571876368164, + "eval_bleu_length_ratio": 0.9656537084678045, + "eval_bleu_precisions": [ + 0.3962015689171864, + 0.15812588069516204, + 0.070042250139216, + 0.031350383345458616 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230095, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.931606701982744, + "eval_chrf_word_order": 2, + "eval_loss": 2.023048162460327, + "eval_meteor": 0.3138137947441302, + "eval_runtime": 927.1333, + "eval_samples_per_second": 18.55, + "eval_scarebleu_bp": 0.9904085263131372, + "eval_scarebleu_counts": [ + 104973, + 40589, + 17257, + 7460 + ], + "eval_scarebleu_precisions": [ + 42.27770304558306, + 17.56346847022272, + 8.066808148612138, + 3.78972608306917 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.15688126802254, + "eval_scarebleu_sys_len": 248294, + "eval_scarebleu_totals": [ + 248294, + 231099, + 213926, + 196848 + ], + "eval_steps_per_second": 0.58, + "eval_ter_num_edits": 155008, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.9844346038128, + "step": 242500 + }, + { + "epoch": 95.18, + "learning_rate": 2.6421930517173317e-05, + "loss": 1.6701, + "step": 243000 + }, + { + "epoch": 95.18, + "eval_bleu_bleu": 0.10394231994441043, + "eval_bleu_brevity_penalty": 0.965117992700678, + "eval_bleu_length_ratio": 0.9657124631209633, + "eval_bleu_precisions": [ + 0.39645559278428916, + 0.15827047540321446, + 0.06951617599730273, + 0.030843783399642992 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230109, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.925686105904255, + "eval_chrf_word_order": 2, + "eval_loss": 2.026986837387085, + "eval_meteor": 0.31400676467454897, + "eval_runtime": 946.0458, + "eval_samples_per_second": 18.179, + "eval_scarebleu_bp": 0.9890141193449017, + "eval_scarebleu_counts": [ + 104872, + 40555, + 17113, + 7351 + ], + "eval_scarebleu_precisions": [ + 42.295965283043216, + 17.575069446551073, + 8.012454349658208, + 3.740966921119593 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.083391545921348, + "eval_scarebleu_sys_len": 247948, + "eval_scarebleu_totals": [ + 247948, + 230753, + 213580, + 196500 + ], + "eval_steps_per_second": 0.569, + "eval_ter_num_edits": 154933, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.95008906941919, + "step": 243000 + }, + { + "epoch": 95.38, + "learning_rate": 2.637258191867351e-05, + "loss": 1.6717, + "step": 243500 + }, + { + "epoch": 95.38, + "eval_bleu_bleu": 0.10394574622405782, + "eval_bleu_brevity_penalty": 0.9646922823154045, + "eval_bleu_length_ratio": 0.9653011805488524, + "eval_bleu_precisions": [ + 0.39629843790079605, + 0.15804732726862641, + 0.06957179510769011, + 0.030933491593368754 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230011, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.923106143283874, + "eval_chrf_word_order": 2, + "eval_loss": 2.0284321308135986, + "eval_meteor": 0.313784105242856, + "eval_runtime": 933.2832, + "eval_samples_per_second": 18.427, + "eval_scarebleu_bp": 0.9899573682059217, + "eval_scarebleu_counts": [ + 104889, + 40551, + 17165, + 7364 + ], + "eval_scarebleu_precisions": [ + 42.2629360711091, + 17.55553342828817, + 8.028043196625088, + 3.7431062088596336 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.096796615519237, + "eval_scarebleu_sys_len": 248182, + "eval_scarebleu_totals": [ + 248182, + 230987, + 213813, + 196735 + ], + "eval_steps_per_second": 0.576, + "eval_ter_num_edits": 155022, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.99084577023295, + "step": 243500 + }, + { + "epoch": 95.57, + "learning_rate": 2.6323332017370704e-05, + "loss": 1.6722, + "step": 244000 + }, + { + "epoch": 95.57, + "eval_bleu_bleu": 0.10490422330543905, + "eval_bleu_brevity_penalty": 0.9672959323467853, + "eval_bleu_length_ratio": 0.9678192371127964, + "eval_bleu_precisions": [ + 0.39656391065473895, + 0.15856355662180904, + 0.07011322062225483, + 0.031377472726765436 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230611, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.976660035427074, + "eval_chrf_word_order": 2, + "eval_loss": 2.023160457611084, + "eval_meteor": 0.3147771888988531, + "eval_runtime": 950.9938, + "eval_samples_per_second": 18.084, + "eval_scarebleu_bp": 0.9882112617372042, + "eval_scarebleu_counts": [ + 104892, + 40586, + 17243, + 7450 + ], + "eval_scarebleu_precisions": [ + 42.3380114551421, + 17.60368503691109, + 8.080850684925087, + 3.7951727440372487 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.150816657276733, + "eval_scarebleu_sys_len": 247749, + "eval_scarebleu_totals": [ + 247749, + 230554, + 213381, + 196302 + ], + "eval_steps_per_second": 0.566, + "eval_ter_num_edits": 154882, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.92673410603153, + "step": 244000 + }, + { + "epoch": 95.77, + "learning_rate": 2.6273983418870908e-05, + "loss": 1.6923, + "step": 244500 + }, + { + "epoch": 95.77, + "eval_bleu_bleu": 0.10431387639210105, + "eval_bleu_brevity_penalty": 0.9640620838555775, + "eval_bleu_length_ratio": 0.9646926502125659, + "eval_bleu_precisions": [ + 0.39627870150435474, + 0.15842310423141848, + 0.06999166278790235, + 0.031194840271434897 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229866, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.97006211277896, + "eval_chrf_word_order": 2, + "eval_loss": 2.0251972675323486, + "eval_meteor": 0.31328597149400317, + "eval_runtime": 947.978, + "eval_samples_per_second": 18.142, + "eval_scarebleu_bp": 0.9877510460903308, + "eval_scarebleu_counts": [ + 104724, + 40540, + 17196, + 7423 + ], + "eval_scarebleu_precisions": [ + 42.28966018535344, + 17.592431869467106, + 8.063132130146718, + 3.78365428725801 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.123871447032334, + "eval_scarebleu_sys_len": 247635, + "eval_scarebleu_totals": [ + 247635, + 230440, + 213267, + 196186 + ], + "eval_steps_per_second": 0.568, + "eval_ter_num_edits": 155047, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 71.0022942816975, + "step": 244500 + }, + { + "epoch": 95.97, + "learning_rate": 2.6224634820371104e-05, + "loss": 1.6808, + "step": 245000 + }, + { + "epoch": 95.97, + "eval_bleu_bleu": 0.10486831250636391, + "eval_bleu_brevity_penalty": 0.9629746350011407, + "eval_bleu_length_ratio": 0.9636434599775893, + "eval_bleu_precisions": [ + 0.3973068078879521, + 0.15927332984968529, + 0.07062890504967735, + 0.03146778592029807 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229616, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.030167546116644, + "eval_chrf_word_order": 2, + "eval_loss": 2.024559736251831, + "eval_meteor": 0.314521940114719, + "eval_runtime": 939.6957, + "eval_samples_per_second": 18.302, + "eval_scarebleu_bp": 0.9871492206006546, + "eval_scarebleu_counts": [ + 104907, + 40713, + 17342, + 7477 + ], + "eval_scarebleu_precisions": [ + 42.389064431927466, + 17.678936649717098, + 8.137276063026118, + 3.8140370028412716 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.190633862896481, + "eval_scarebleu_sys_len": 247486, + "eval_scarebleu_totals": [ + 247486, + 230291, + 213118, + 196039 + ], + "eval_steps_per_second": 0.573, + "eval_ter_num_edits": 154817, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.89696797622373, + "step": 245000 + }, + { + "epoch": 96.16, + "learning_rate": 2.6175286221871297e-05, + "loss": 1.6632, + "step": 245500 + }, + { + "epoch": 96.16, + "eval_bleu_bleu": 0.10420031493904251, + "eval_bleu_brevity_penalty": 0.9627831260665745, + "eval_bleu_length_ratio": 0.9634588024962334, + "eval_bleu_precisions": [ + 0.3964638544770268, + 0.15852940761005194, + 0.07004036554380788, + 0.031167387900116184 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229572, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.97477216631844, + "eval_chrf_word_order": 2, + "eval_loss": 2.0253052711486816, + "eval_meteor": 0.3133309739882684, + "eval_runtime": 935.99, + "eval_samples_per_second": 18.374, + "eval_scarebleu_bp": 0.9865389519288192, + "eval_scarebleu_counts": [ + 104688, + 40511, + 17205, + 7412 + ], + "eval_scarebleu_precisions": [ + 42.32639941779368, + 17.60276353523942, + 8.078716420853935, + 3.783814137742678 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.1193777544559, + "eval_scarebleu_sys_len": 247335, + "eval_scarebleu_totals": [ + 247335, + 230140, + 212967, + 195887 + ], + "eval_steps_per_second": 0.575, + "eval_ter_num_edits": 154932, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.9496311289606, + "step": 245500 + }, + { + "epoch": 96.36, + "learning_rate": 2.6126036320568498e-05, + "loss": 1.6693, + "step": 246000 + }, + { + "epoch": 96.36, + "eval_bleu_bleu": 0.10446599247526588, + "eval_bleu_brevity_penalty": 0.9669708340980812, + "eval_bleu_length_ratio": 0.9675044800423034, + "eval_bleu_precisions": [ + 0.3967449769233439, + 0.15816462845866477, + 0.069788305578069, + 0.03110590074247753 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230536, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.97620251163994, + "eval_chrf_word_order": 2, + "eval_loss": 2.0225656032562256, + "eval_meteor": 0.31454960166116264, + "eval_runtime": 923.9386, + "eval_samples_per_second": 18.614, + "eval_scarebleu_bp": 0.9912378088935376, + "eval_scarebleu_counts": [ + 105163, + 40621, + 17217, + 7410 + ], + "eval_scarebleu_precisions": [ + 42.31911468812877, + 17.561661010354293, + 8.04036762370874, + 3.760466886577011 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.136202620723923, + "eval_scarebleu_sys_len": 248500, + "eval_scarebleu_totals": [ + 248500, + 231305, + 214132, + 197050 + ], + "eval_steps_per_second": 0.582, + "eval_ter_num_edits": 154884, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.9276499869487, + "step": 246000 + }, + { + "epoch": 96.55, + "learning_rate": 2.6076687722068694e-05, + "loss": 1.6711, + "step": 246500 + }, + { + "epoch": 96.55, + "eval_bleu_bleu": 0.10420167513750495, + "eval_bleu_brevity_penalty": 0.9645315094470411, + "eval_bleu_length_ratio": 0.9651459003940759, + "eval_bleu_precisions": [ + 0.39638393905398, + 0.15858237890017343, + 0.06988656405118164, + 0.03100762170365517 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229974, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.00263679732417, + "eval_chrf_word_order": 2, + "eval_loss": 2.023848533630371, + "eval_meteor": 0.3140325365847866, + "eval_runtime": 934.9737, + "eval_samples_per_second": 18.394, + "eval_scarebleu_bp": 0.9889455584100092, + "eval_scarebleu_counts": [ + 104900, + 40624, + 17237, + 7407 + ], + "eval_scarebleu_precisions": [ + 42.31015887484824, + 17.60626863601692, + 8.071154647574721, + 3.769772602349301 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.1342540943147, + "eval_scarebleu_sys_len": 247931, + "eval_scarebleu_totals": [ + 247931, + 230736, + 213563, + 196484 + ], + "eval_steps_per_second": 0.575, + "eval_ter_num_edits": 154959, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.96199552134232, + "step": 246500 + }, + { + "epoch": 96.75, + "learning_rate": 2.6027339123568894e-05, + "loss": 1.6793, + "step": 247000 + }, + { + "epoch": 96.75, + "eval_bleu_bleu": 0.10420184355941192, + "eval_bleu_brevity_penalty": 0.9624740258114518, + "eval_bleu_length_ratio": 0.9631608324695, + "eval_bleu_precisions": [ + 0.3972967438050379, + 0.15890271589121363, + 0.07016321197058598, + 0.031016282987085905 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229501, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.002871557044436, + "eval_chrf_word_order": 2, + "eval_loss": 2.020578384399414, + "eval_meteor": 0.3135920925758619, + "eval_runtime": 931.6626, + "eval_samples_per_second": 18.459, + "eval_scarebleu_bp": 0.98608606486081, + "eval_scarebleu_counts": [ + 104868, + 40591, + 17237, + 7396 + ], + "eval_scarebleu_precisions": [ + 42.418383402838735, + 17.646112647156, + 8.09796294208291, + 3.7777482658930013 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.130195813816442, + "eval_scarebleu_sys_len": 247223, + "eval_scarebleu_totals": [ + 247223, + 230028, + 212856, + 195778 + ], + "eval_steps_per_second": 0.577, + "eval_ter_num_edits": 154824, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.9001735594338, + "step": 247000 + }, + { + "epoch": 96.94, + "learning_rate": 2.597799052506909e-05, + "loss": 1.6761, + "step": 247500 + }, + { + "epoch": 96.94, + "eval_bleu_bleu": 0.10468825445727727, + "eval_bleu_brevity_penalty": 0.9677465661456955, + "eval_bleu_length_ratio": 0.9682557002505466, + "eval_bleu_precisions": [ + 0.39685326051622133, + 0.15853784188834769, + 0.07004517236286598, + 0.031074501843166343 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230715, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.04131199588771, + "eval_chrf_word_order": 2, + "eval_loss": 2.021780490875244, + "eval_meteor": 0.31460894582990867, + "eval_runtime": 930.6543, + "eval_samples_per_second": 18.479, + "eval_scarebleu_bp": 0.9899533391006791, + "eval_scarebleu_counts": [ + 105084, + 40651, + 17271, + 7437 + ], + "eval_scarebleu_precisions": [ + 42.341678049488074, + 17.598902097962647, + 8.077581449297053, + 3.7802503901226534 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.158461201962936, + "eval_scarebleu_sys_len": 248181, + "eval_scarebleu_totals": [ + 248181, + 230986, + 213814, + 196733 + ], + "eval_steps_per_second": 0.578, + "eval_ter_num_edits": 154879, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.9253602846558, + "step": 247500 + }, + { + "epoch": 97.14, + "learning_rate": 2.5928641926569287e-05, + "loss": 1.6669, + "step": 248000 + }, + { + "epoch": 97.14, + "eval_bleu_bleu": 0.10442249327344132, + "eval_bleu_brevity_penalty": 0.9650658742929654, + "eval_bleu_length_ratio": 0.9656621019896844, + "eval_bleu_precisions": [ + 0.3964979986701261, + 0.15859409493569812, + 0.07003167467048126, + 0.03112618360083272 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230097, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.02961857740174, + "eval_chrf_word_order": 2, + "eval_loss": 2.0227203369140625, + "eval_meteor": 0.3139866840412079, + "eval_runtime": 931.2998, + "eval_samples_per_second": 18.467, + "eval_scarebleu_bp": 0.9886188218682643, + "eval_scarebleu_counts": [ + 104955, + 40651, + 17241, + 7436 + ], + "eval_scarebleu_precisions": [ + 42.346177123260034, + 17.624157291192475, + 8.076128554765997, + 3.786131435175992 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.150922319495198, + "eval_scarebleu_sys_len": 247850, + "eval_scarebleu_totals": [ + 247850, + 230655, + 213481, + 196401 + ], + "eval_steps_per_second": 0.578, + "eval_ter_num_edits": 154919, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.94367790299904, + "step": 248000 + }, + { + "epoch": 97.34, + "learning_rate": 2.5879392025266484e-05, + "loss": 1.6583, + "step": 248500 + }, + { + "epoch": 97.34, + "eval_bleu_bleu": 0.10427035974134839, + "eval_bleu_brevity_penalty": 0.9690150842128333, + "eval_bleu_length_ratio": 0.9694853512059393, + "eval_bleu_precisions": [ + 0.3963455811054163, + 0.15835800442442696, + 0.06942212639586681, + 0.030768716800855245 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 231008, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.025217483136444, + "eval_chrf_word_order": 2, + "eval_loss": 2.024049997329712, + "eval_meteor": 0.31499291543599744, + "eval_runtime": 935.8047, + "eval_samples_per_second": 18.378, + "eval_scarebleu_bp": 0.9925126075828865, + "eval_scarebleu_counts": [ + 105213, + 40729, + 17203, + 7384 + ], + "eval_scarebleu_precisions": [ + 42.285294011261286, + 17.584253654661474, + 8.021991345221219, + 3.7412915157196056 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.130823679505802, + "eval_scarebleu_sys_len": 248817, + "eval_scarebleu_totals": [ + 248817, + 231622, + 214448, + 197365 + ], + "eval_steps_per_second": 0.575, + "eval_ter_num_edits": 154892, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.93131351061734, + "step": 248500 + }, + { + "epoch": 97.53, + "learning_rate": 2.583004342676668e-05, + "loss": 1.6666, + "step": 249000 + }, + { + "epoch": 97.53, + "eval_bleu_bleu": 0.10465743196274642, + "eval_bleu_brevity_penalty": 0.9681970035138047, + "eval_bleu_length_ratio": 0.9686921633882969, + "eval_bleu_precisions": [ + 0.3968390817047123, + 0.1582687338501292, + 0.06982994253370864, + 0.03112964088043654 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230819, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.024549828480545, + "eval_chrf_word_order": 2, + "eval_loss": 2.020779609680176, + "eval_meteor": 0.3150331985504469, + "eval_runtime": 946.0667, + "eval_samples_per_second": 18.178, + "eval_scarebleu_bp": 0.989421356116444, + "eval_scarebleu_counts": [ + 105097, + 40622, + 17212, + 7408 + ], + "eval_scarebleu_precisions": [ + 42.3694511971425, + 17.5964029213269, + 8.05496017446486, + 3.768056968463886 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.135164803257126, + "eval_scarebleu_sys_len": 248049, + "eval_scarebleu_totals": [ + 248049, + 230854, + 213682, + 196600 + ], + "eval_steps_per_second": 0.569, + "eval_ter_num_edits": 154870, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.92123882052856, + "step": 249000 + }, + { + "epoch": 97.73, + "learning_rate": 2.5780694828266877e-05, + "loss": 1.67, + "step": 249500 + }, + { + "epoch": 97.73, + "eval_bleu_bleu": 0.1046065082979423, + "eval_bleu_brevity_penalty": 0.9663073166513073, + "eval_bleu_length_ratio": 0.9668623756184976, + "eval_bleu_precisions": [ + 0.39667857437397724, + 0.15864870442989287, + 0.07015834472626359, + 0.03110420775621721 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230383, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.012703447815085, + "eval_chrf_word_order": 2, + "eval_loss": 2.02087664604187, + "eval_meteor": 0.31402701984313763, + "eval_runtime": 945.9233, + "eval_samples_per_second": 18.181, + "eval_scarebleu_bp": 0.9871573011634718, + "eval_scarebleu_counts": [ + 104845, + 40589, + 17249, + 7415 + ], + "eval_scarebleu_precisions": [ + 42.36367015774502, + 17.62493866509186, + 8.093524335940616, + 3.782314174369019 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.137814035519849, + "eval_scarebleu_sys_len": 247488, + "eval_scarebleu_totals": [ + 247488, + 230293, + 213121, + 196044 + ], + "eval_steps_per_second": 0.569, + "eval_ter_num_edits": 154887, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.92902380832444, + "step": 249500 + }, + { + "epoch": 97.92, + "learning_rate": 2.5731346229767077e-05, + "loss": 1.6689, + "step": 250000 + }, + { + "epoch": 97.92, + "eval_bleu_bleu": 0.10447460987417191, + "eval_bleu_brevity_penalty": 0.9640794737780265, + "eval_bleu_length_ratio": 0.9647094372563255, + "eval_bleu_precisions": [ + 0.397011354243703, + 0.1587680733513577, + 0.07015282636715153, + 0.031187489143772867 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229870, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.06886740401126, + "eval_chrf_word_order": 2, + "eval_loss": 2.020782232284546, + "eval_meteor": 0.3138732467019054, + "eval_runtime": 943.4427, + "eval_samples_per_second": 18.229, + "eval_scarebleu_bp": 0.9878963999540928, + "eval_scarebleu_counts": [ + 104948, + 40643, + 17271, + 7446 + ], + "eval_scarebleu_precisions": [ + 42.37395577197169, + 17.634374077995105, + 8.096894573003787, + 3.794623518919608 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.160402836516107, + "eval_scarebleu_sys_len": 247671, + "eval_scarebleu_totals": [ + 247671, + 230476, + 213304, + 196225 + ], + "eval_steps_per_second": 0.57, + "eval_ter_num_edits": 154760, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.87086537008457, + "step": 250000 + }, + { + "epoch": 98.12, + "learning_rate": 2.568209632846427e-05, + "loss": 1.6641, + "step": 250500 + }, + { + "epoch": 98.12, + "eval_bleu_bleu": 0.1048751606326541, + "eval_bleu_brevity_penalty": 0.9666803265440513, + "eval_bleu_length_ratio": 0.9672232970593296, + "eval_bleu_precisions": [ + 0.3964177394790623, + 0.15869257387210817, + 0.07024011666743153, + 0.03135191886699727 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230469, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.0741539238474, + "eval_chrf_word_order": 2, + "eval_loss": 2.0243330001831055, + "eval_meteor": 0.3140838305431777, + "eval_runtime": 953.7599, + "eval_samples_per_second": 18.032, + "eval_scarebleu_bp": 0.9884977815438599, + "eval_scarebleu_counts": [ + 104862, + 40649, + 17293, + 7467 + ], + "eval_scarebleu_precisions": [ + 42.31377612783472, + 17.62558265582656, + 8.101587242096583, + 3.802496295277816 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.17003266145472, + "eval_scarebleu_sys_len": 247820, + "eval_scarebleu_totals": [ + 247820, + 230625, + 213452, + 196371 + ], + "eval_steps_per_second": 0.564, + "eval_ter_num_edits": 154958, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.96153758088374, + "step": 250500 + }, + { + "epoch": 98.32, + "learning_rate": 2.5632747729964467e-05, + "loss": 1.6542, + "step": 251000 + }, + { + "epoch": 98.32, + "eval_bleu_bleu": 0.10434191762876502, + "eval_bleu_brevity_penalty": 0.965834355036198, + "eval_bleu_length_ratio": 0.9664049286760479, + "eval_bleu_precisions": [ + 0.3971659848701981, + 0.15866885052022958, + 0.0699312477988577, + 0.030909334853922787 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230274, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 34.99073198254644, + "eval_chrf_word_order": 2, + "eval_loss": 2.0206620693206787, + "eval_meteor": 0.31456207887364085, + "eval_runtime": 959.9715, + "eval_samples_per_second": 17.915, + "eval_scarebleu_bp": 0.9873633337385181, + "eval_scarebleu_counts": [ + 104975, + 40574, + 17202, + 7387 + ], + "eval_scarebleu_precisions": [ + 42.40745902665842, + 17.614524363560587, + 8.06954008969283, + 3.7669940539934115 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.120379492491315, + "eval_scarebleu_sys_len": 247539, + "eval_scarebleu_totals": [ + 247539, + 230344, + 213172, + 196098 + ], + "eval_steps_per_second": 0.56, + "eval_ter_num_edits": 154834, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.90475296401961, + "step": 251000 + }, + { + "epoch": 98.51, + "learning_rate": 2.558339913146467e-05, + "loss": 1.6584, + "step": 251500 + }, + { + "epoch": 98.51, + "eval_bleu_bleu": 0.10478661538788085, + "eval_bleu_brevity_penalty": 0.963662035165984, + "eval_bleu_length_ratio": 0.9643065482060945, + "eval_bleu_precisions": [ + 0.39739483144307014, + 0.15909379571829768, + 0.07044898627557339, + 0.03138875185002467 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229774, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.012984104276974, + "eval_chrf_word_order": 2, + "eval_loss": 2.018900156021118, + "eval_meteor": 0.31444099856952057, + "eval_runtime": 959.5808, + "eval_samples_per_second": 17.922, + "eval_scarebleu_bp": 0.987238103246631, + "eval_scarebleu_counts": [ + 104954, + 40642, + 17288, + 7449 + ], + "eval_scarebleu_precisions": [ + 42.4042859220712, + 17.646420306278845, + 8.111062629902271, + 3.799211494030102 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.16553769183433, + "eval_scarebleu_sys_len": 247508, + "eval_scarebleu_totals": [ + 247508, + 230313, + 213141, + 196067 + ], + "eval_steps_per_second": 0.561, + "eval_ter_num_edits": 154669, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.82919278835365, + "step": 251500 + }, + { + "epoch": 98.71, + "learning_rate": 2.5534050532964863e-05, + "loss": 1.6645, + "step": 252000 + }, + { + "epoch": 98.71, + "eval_bleu_bleu": 0.10475264921909212, + "eval_bleu_brevity_penalty": 0.9648573744460076, + "eval_bleu_length_ratio": 0.9654606574645689, + "eval_bleu_precisions": [ + 0.39698933705427975, + 0.15909966455880556, + 0.0703196860372422, + 0.03128113839160761 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230049, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.015337547210876, + "eval_chrf_word_order": 2, + "eval_loss": 2.0223500728607178, + "eval_meteor": 0.3144240146222364, + "eval_runtime": 957.649, + "eval_samples_per_second": 17.959, + "eval_scarebleu_bp": 0.9867329844666088, + "eval_scarebleu_counts": [ + 104850, + 40609, + 17241, + 7411 + ], + "eval_scarebleu_precisions": [ + 42.38367228144214, + 17.641666811475837, + 8.093796211534398, + 3.782396112976819 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.137074398710276, + "eval_scarebleu_sys_len": 247383, + "eval_scarebleu_totals": [ + 247383, + 230188, + 213015, + 195934 + ], + "eval_steps_per_second": 0.562, + "eval_ter_num_edits": 154850, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.91208001135692, + "step": 252000 + }, + { + "epoch": 98.9, + "learning_rate": 2.5484800631662064e-05, + "loss": 1.6665, + "step": 252500 + }, + { + "epoch": 98.9, + "eval_bleu_bleu": 0.10516002290316409, + "eval_bleu_brevity_penalty": 0.9628484171706294, + "eval_bleu_length_ratio": 0.963521753910332, + "eval_bleu_precisions": [ + 0.39810616454764425, + 0.15969057214961016, + 0.07078317881473134, + 0.0316200653279305 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229587, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.08686092725171, + "eval_chrf_word_order": 2, + "eval_loss": 2.021747589111328, + "eval_meteor": 0.31461693526948886, + "eval_runtime": 946.1197, + "eval_samples_per_second": 18.177, + "eval_scarebleu_bp": 0.987779310976172, + "eval_scarebleu_counts": [ + 105150, + 40822, + 17386, + 7534 + ], + "eval_scarebleu_precisions": [ + 42.46048731636798, + 17.714268356715426, + 8.151992985516216, + 3.8401353782793297 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.236002503602768, + "eval_scarebleu_sys_len": 247642, + "eval_scarebleu_totals": [ + 247642, + 230447, + 213273, + 196191 + ], + "eval_steps_per_second": 0.569, + "eval_ter_num_edits": 154591, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.79347343258429, + "step": 252500 + }, + { + "epoch": 99.1, + "learning_rate": 2.543545203316226e-05, + "loss": 1.6604, + "step": 253000 + }, + { + "epoch": 99.1, + "eval_bleu_bleu": 0.10540424343941981, + "eval_bleu_brevity_penalty": 0.9643055162420654, + "eval_bleu_length_ratio": 0.9649276688252008, + "eval_bleu_precisions": [ + 0.3974217343272936, + 0.15937798210852408, + 0.07070758720841046, + 0.03187335801791406 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229922, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.02587936633585, + "eval_chrf_word_order": 2, + "eval_loss": 2.021120548248291, + "eval_meteor": 0.31450789304623356, + "eval_runtime": 961.514, + "eval_samples_per_second": 17.886, + "eval_scarebleu_bp": 0.9895060085092922, + "eval_scarebleu_counts": [ + 105194, + 40845, + 17424, + 7593 + ], + "eval_scarebleu_precisions": [ + 42.404966340145926, + 17.69139144558744, + 8.153409888536373, + 3.86174416771352 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.267153739186144, + "eval_scarebleu_sys_len": 248070, + "eval_scarebleu_totals": [ + 248070, + 230875, + 213702, + 196621 + ], + "eval_steps_per_second": 0.56, + "eval_ter_num_edits": 154646, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.81866015780628, + "step": 253000 + }, + { + "epoch": 99.29, + "learning_rate": 2.5386103434662457e-05, + "loss": 1.6541, + "step": 253500 + }, + { + "epoch": 99.29, + "eval_bleu_bleu": 0.10505343370338718, + "eval_bleu_brevity_penalty": 0.9664201012659354, + "eval_bleu_length_ratio": 0.9669714914029353, + "eval_bleu_precisions": [ + 0.39774053964905887, + 0.15907022990985584, + 0.07031807887703262, + 0.03138494885560577 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230409, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.066014431036976, + "eval_chrf_word_order": 2, + "eval_loss": 2.0218863487243652, + "eval_meteor": 0.31545141432171575, + "eval_runtime": 945.2131, + "eval_samples_per_second": 18.195, + "eval_scarebleu_bp": 0.9883888328681568, + "eval_scarebleu_counts": [ + 105232, + 40742, + 17315, + 7471 + ], + "eval_scarebleu_precisions": [ + 42.467704898847025, + 17.66797630508504, + 8.112920229588848, + 3.805017672883583 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.193340473081223, + "eval_scarebleu_sys_len": 247793, + "eval_scarebleu_totals": [ + 247793, + 230598, + 213425, + 196346 + ], + "eval_steps_per_second": 0.569, + "eval_ter_num_edits": 154735, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.85941685862004, + "step": 253500 + }, + { + "epoch": 99.49, + "learning_rate": 2.533675483616265e-05, + "loss": 1.6534, + "step": 254000 + }, + { + "epoch": 99.49, + "eval_bleu_bleu": 0.10410331681996535, + "eval_bleu_brevity_penalty": 0.9651918226243615, + "eval_bleu_length_ratio": 0.9657838080569416, + "eval_bleu_precisions": [ + 0.396982522618044, + 0.15868051152720836, + 0.06965827246258365, + 0.030841539838854074 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230126, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.07173709836242, + "eval_chrf_word_order": 2, + "eval_loss": 2.022385358810425, + "eval_meteor": 0.3144050553025139, + "eval_runtime": 958.2862, + "eval_samples_per_second": 17.947, + "eval_scarebleu_bp": 0.9866602266178838, + "eval_scarebleu_counts": [ + 104860, + 40554, + 17164, + 7365 + ], + "eval_scarebleu_precisions": [ + 42.3907990216886, + 17.619151062258332, + 8.058329460039344, + 3.759187423438138 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.100867808708387, + "eval_scarebleu_sys_len": 247365, + "eval_scarebleu_totals": [ + 247365, + 230170, + 212997, + 195920 + ], + "eval_steps_per_second": 0.561, + "eval_ter_num_edits": 154957, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.96107964042515, + "step": 254000 + }, + { + "epoch": 99.69, + "learning_rate": 2.528750493485985e-05, + "loss": 1.6604, + "step": 254500 + }, + { + "epoch": 99.69, + "eval_bleu_bleu": 0.10483283767978054, + "eval_bleu_brevity_penalty": 0.9679588159113904, + "eval_bleu_length_ratio": 0.968461341536602, + "eval_bleu_precisions": [ + 0.39664332391534207, + 0.1588011368691149, + 0.0700582460999552, + 0.031178041559571136 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230764, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.12402048395441, + "eval_chrf_word_order": 2, + "eval_loss": 2.021698474884033, + "eval_meteor": 0.3151833719412797, + "eval_runtime": 937.731, + "eval_samples_per_second": 18.34, + "eval_scarebleu_bp": 0.990332004757377, + "eval_scarebleu_counts": [ + 105153, + 40775, + 17319, + 7462 + ], + "eval_scarebleu_precisions": [ + 42.3534387272178, + 17.645404189025445, + 8.096509230646964, + 3.7911850628731107 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.187905729518066, + "eval_scarebleu_sys_len": 248275, + "eval_scarebleu_totals": [ + 248275, + 231080, + 213907, + 196825 + ], + "eval_steps_per_second": 0.574, + "eval_ter_num_edits": 154910, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.93955643887182, + "step": 254500 + }, + { + "epoch": 99.88, + "learning_rate": 2.5238156336360047e-05, + "loss": 1.6608, + "step": 255000 + }, + { + "epoch": 99.88, + "eval_bleu_bleu": 0.10442735663530449, + "eval_bleu_brevity_penalty": 0.9657909532392998, + "eval_bleu_length_ratio": 0.9663629610666488, + "eval_bleu_precisions": [ + 0.39779123093492685, + 0.15911277567360807, + 0.0699723336702296, + 0.030862989572558775 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230264, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.09146892458418, + "eval_chrf_word_order": 2, + "eval_loss": 2.018340587615967, + "eval_meteor": 0.31554605094167654, + "eval_runtime": 958.6659, + "eval_samples_per_second": 17.94, + "eval_scarebleu_bp": 0.9881628278383284, + "eval_scarebleu_counts": [ + 105202, + 40742, + 17258, + 7405 + ], + "eval_scarebleu_precisions": [ + 42.465194944638874, + 17.672267959851133, + 8.088335231453492, + 3.7725179328333875 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.155770142923448, + "eval_scarebleu_sys_len": 247737, + "eval_scarebleu_totals": [ + 247737, + 230542, + 213369, + 196288 + ], + "eval_steps_per_second": 0.561, + "eval_ter_num_edits": 154718, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.85163187082415, + "step": 255000 + }, + { + "epoch": 100.08, + "learning_rate": 2.5188807737860247e-05, + "loss": 1.6536, + "step": 255500 + }, + { + "epoch": 100.08, + "eval_bleu_bleu": 0.10459393634732266, + "eval_bleu_brevity_penalty": 0.966532873589009, + "eval_bleu_length_ratio": 0.9670806071873728, + "eval_bleu_precisions": [ + 0.3966367956256645, + 0.15898987056837366, + 0.06991024071807425, + 0.03110686596510043 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230435, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.172805782224536, + "eval_chrf_word_order": 2, + "eval_loss": 2.0238609313964844, + "eval_meteor": 0.31511617734435327, + "eval_runtime": 958.4235, + "eval_samples_per_second": 17.944, + "eval_scarebleu_bp": 0.9884816417396324, + "eval_scarebleu_counts": [ + 104965, + 40708, + 17251, + 7419 + ], + "eval_scarebleu_precisions": [ + 42.356022210026794, + 17.65147146183565, + 8.082024277462063, + 3.778110486433635 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.150421101989723, + "eval_scarebleu_sys_len": 247816, + "eval_scarebleu_totals": [ + 247816, + 230621, + 213449, + 196368 + ], + "eval_steps_per_second": 0.561, + "eval_ter_num_edits": 154902, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.93589291520317, + "step": 255500 + }, + { + "epoch": 100.27, + "learning_rate": 2.5139459139360444e-05, + "loss": 1.6433, + "step": 256000 + }, + { + "epoch": 100.27, + "eval_bleu_bleu": 0.10406379292413416, + "eval_bleu_brevity_penalty": 0.9632966385825339, + "eval_bleu_length_ratio": 0.9639540202871424, + "eval_bleu_precisions": [ + 0.3973137707344682, + 0.1587896185792607, + 0.06978815771959823, + 0.030932923511826305 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229690, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.06685732581369, + "eval_chrf_word_order": 2, + "eval_loss": 2.0234251022338867, + "eval_meteor": 0.31443086683640625, + "eval_runtime": 953.7931, + "eval_samples_per_second": 18.031, + "eval_scarebleu_bp": 0.9854913434991063, + "eval_scarebleu_counts": [ + 104819, + 40531, + 17154, + 7350 + ], + "eval_scarebleu_precisions": [ + 42.42378863183798, + 17.631296192377796, + 8.064614704734682, + 3.757073265484509 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.091621902758021, + "eval_scarebleu_sys_len": 247076, + "eval_scarebleu_totals": [ + 247076, + 229881, + 212707, + 195631 + ], + "eval_steps_per_second": 0.564, + "eval_ter_num_edits": 154822, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.89925767851663, + "step": 256000 + }, + { + "epoch": 100.47, + "learning_rate": 2.5090209238057638e-05, + "loss": 1.651, + "step": 256500 + }, + { + "epoch": 100.47, + "eval_bleu_bleu": 0.10468324656406536, + "eval_bleu_brevity_penalty": 0.9678375356698804, + "eval_bleu_length_ratio": 0.9683438322302846, + "eval_bleu_precisions": [ + 0.3968734831149019, + 0.15903269161425676, + 0.07007877624389573, + 0.0309438170918723 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230736, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.1364212226323, + "eval_chrf_word_order": 2, + "eval_loss": 2.021488666534424, + "eval_meteor": 0.3154136932688246, + "eval_runtime": 959.6057, + "eval_samples_per_second": 17.922, + "eval_scarebleu_bp": 0.9891633241344326, + "eval_scarebleu_counts": [ + 105103, + 40765, + 17278, + 7400 + ], + "eval_scarebleu_precisions": [ + 42.38280541161764, + 17.663243641405607, + 8.088345442288967, + 3.7652709723049056 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.154777888311573, + "eval_scarebleu_sys_len": 247985, + "eval_scarebleu_totals": [ + 247985, + 230790, + 213616, + 196533 + ], + "eval_steps_per_second": 0.561, + "eval_ter_num_edits": 154858, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.91574353502558, + "step": 256500 + }, + { + "epoch": 100.67, + "learning_rate": 2.504086063955784e-05, + "loss": 1.659, + "step": 257000 + }, + { + "epoch": 100.67, + "eval_bleu_bleu": 0.10418184176298918, + "eval_bleu_brevity_penalty": 0.9654653817674756, + "eval_bleu_length_ratio": 0.9660482039961558, + "eval_bleu_precisions": [ + 0.3965958408090743, + 0.15870400105167282, + 0.06982040637079931, + 0.030853390460955022 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230189, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.10213202786547, + "eval_chrf_word_order": 2, + "eval_loss": 2.0166726112365723, + "eval_meteor": 0.3142077233613374, + "eval_runtime": 940.372, + "eval_samples_per_second": 18.289, + "eval_scarebleu_bp": 0.9880659530859204, + "eval_scarebleu_counts": [ + 104936, + 40619, + 17224, + 7393 + ], + "eval_scarebleu_precisions": [ + 42.361926907348426, + 17.620749789604282, + 8.073346332683366, + 3.7668458461773624 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.128129205964598, + "eval_scarebleu_sys_len": 247713, + "eval_scarebleu_totals": [ + 247713, + 230518, + 213344, + 196265 + ], + "eval_steps_per_second": 0.572, + "eval_ter_num_edits": 155020, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.98992988931579, + "step": 257000 + }, + { + "epoch": 100.86, + "learning_rate": 2.4991512041058034e-05, + "loss": 1.6567, + "step": 257500 + }, + { + "epoch": 100.86, + "eval_bleu_bleu": 0.10471670776396615, + "eval_bleu_brevity_penalty": 0.9664895010731387, + "eval_bleu_length_ratio": 0.9670386395779738, + "eval_bleu_precisions": [ + 0.39739177606596504, + 0.1590911222623458, + 0.07020559298607108, + 0.0310483713291362 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230425, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.1553506577894, + "eval_chrf_word_order": 2, + "eval_loss": 2.0172877311706543, + "eval_meteor": 0.31556011758902747, + "eval_runtime": 951.9222, + "eval_samples_per_second": 18.067, + "eval_scarebleu_bp": 0.9894979466821237, + "eval_scarebleu_counts": [ + 105252, + 40781, + 17302, + 7417 + ], + "eval_scarebleu_precisions": [ + 42.428688907880094, + 17.6638238338827, + 8.096396817969115, + 3.772346972509727 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.171016065845025, + "eval_scarebleu_sys_len": 248068, + "eval_scarebleu_totals": [ + 248068, + 230873, + 213700, + 196615 + ], + "eval_steps_per_second": 0.565, + "eval_ter_num_edits": 154706, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.84613658532118, + "step": 257500 + }, + { + "epoch": 101.06, + "learning_rate": 2.4942163442558234e-05, + "loss": 1.6571, + "step": 258000 + }, + { + "epoch": 101.06, + "eval_bleu_bleu": 0.10439067383292906, + "eval_bleu_brevity_penalty": 0.9640533887850271, + "eval_bleu_length_ratio": 0.9646842566906861, + "eval_bleu_precisions": [ + 0.3973001426930707, + 0.15926157549995534, + 0.07013012255252982, + 0.03098190620814865 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 229864, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.029022548930186, + "eval_chrf_word_order": 2, + "eval_loss": 2.018538475036621, + "eval_meteor": 0.31449389694172775, + "eval_runtime": 957.9577, + "eval_samples_per_second": 17.953, + "eval_scarebleu_bp": 0.9872340632955491, + "eval_scarebleu_counts": [ + 105021, + 40680, + 17250, + 7401 + ], + "eval_scarebleu_precisions": [ + 42.43152718913, + 17.66299628330265, + 8.093347971736621, + 3.7748840910134196 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.14412840241598, + "eval_scarebleu_sys_len": 247507, + "eval_scarebleu_totals": [ + 247507, + 230312, + 213138, + 196059 + ], + "eval_steps_per_second": 0.562, + "eval_ter_num_edits": 154833, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.90429502356103, + "step": 258000 + }, + { + "epoch": 101.25, + "learning_rate": 2.489291354125543e-05, + "loss": 1.6366, + "step": 258500 + }, + { + "epoch": 101.25, + "eval_bleu_bleu": 0.10505565143329842, + "eval_bleu_brevity_penalty": 0.9673089341508212, + "eval_bleu_length_ratio": 0.967831827395616, + "eval_bleu_precisions": [ + 0.3975430806455809, + 0.15932508352114855, + 0.07035636763851665, + 0.0312208786487135 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230614, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.09412027845024, + "eval_chrf_word_order": 2, + "eval_loss": 2.017908811569214, + "eval_meteor": 0.31601148802667317, + "eval_runtime": 956.8426, + "eval_samples_per_second": 17.974, + "eval_scarebleu_bp": 0.990319921876342, + "eval_scarebleu_counts": [ + 105386, + 40864, + 17349, + 7474 + ], + "eval_scarebleu_precisions": [ + 42.44779918798737, + 17.684148573852006, + 8.11064776722268, + 3.7973783152118687 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.211533373837815, + "eval_scarebleu_sys_len": 248272, + "eval_scarebleu_totals": [ + 248272, + 231077, + 213904, + 196820 + ], + "eval_steps_per_second": 0.562, + "eval_ter_num_edits": 154731, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.85758509678571, + "step": 258500 + }, + { + "epoch": 101.45, + "learning_rate": 2.4843564942755628e-05, + "loss": 1.6454, + "step": 259000 + }, + { + "epoch": 101.45, + "eval_bleu_bleu": 0.10486618742886442, + "eval_bleu_brevity_penalty": 0.9659732285613912, + "eval_bleu_length_ratio": 0.9665392250261249, + "eval_bleu_precisions": [ + 0.3971108004133631, + 0.15923626654654147, + 0.07020740196378632, + 0.031285634432643934 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230306, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.15833566220728, + "eval_chrf_word_order": 2, + "eval_loss": 2.0210041999816895, + "eval_meteor": 0.3150299127730556, + "eval_runtime": 942.6537, + "eval_samples_per_second": 18.244, + "eval_scarebleu_bp": 0.989070577800767, + "eval_scarebleu_counts": [ + 105090, + 40763, + 17284, + 7438 + ], + "eval_scarebleu_precisions": [ + 42.38149393858736, + 17.66413741999506, + 8.091987602648015, + 3.7850105845953426 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.170965566914166, + "eval_scarebleu_sys_len": 247962, + "eval_scarebleu_totals": [ + 247962, + 230767, + 213594, + 196512 + ], + "eval_steps_per_second": 0.571, + "eval_ter_num_edits": 154824, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.9001735594338, + "step": 259000 + }, + { + "epoch": 101.65, + "learning_rate": 2.4794216344255824e-05, + "loss": 1.6522, + "step": 259500 + }, + { + "epoch": 101.65, + "eval_bleu_bleu": 0.10504254791477098, + "eval_bleu_brevity_penalty": 0.9656650777398963, + "eval_bleu_length_ratio": 0.9662412549993915, + "eval_bleu_precisions": [ + 0.3974417443047321, + 0.15957566654149455, + 0.07039585864670866, + 0.03135939160096181 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230235, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.10659216330975, + "eval_chrf_word_order": 2, + "eval_loss": 2.0195388793945312, + "eval_meteor": 0.31505741175600827, + "eval_runtime": 929.2671, + "eval_samples_per_second": 18.507, + "eval_scarebleu_bp": 0.9887519494981526, + "eval_scarebleu_counts": [ + 105212, + 40827, + 17352, + 7476 + ], + "eval_scarebleu_precisions": [ + 42.444217634932606, + 17.697929671244278, + 8.126829496756669, + 3.8057615850213042 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.20712196588634, + "eval_scarebleu_sys_len": 247883, + "eval_scarebleu_totals": [ + 247883, + 230688, + 213515, + 196439 + ], + "eval_steps_per_second": 0.579, + "eval_ter_num_edits": 154780, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.88002417925622, + "step": 259500 + }, + { + "epoch": 101.84, + "learning_rate": 2.4744867745756024e-05, + "loss": 1.6497, + "step": 260000 + }, + { + "epoch": 101.84, + "eval_bleu_bleu": 0.1046636975776612, + "eval_bleu_brevity_penalty": 0.9667670537598431, + "eval_bleu_length_ratio": 0.9673072322781278, + "eval_bleu_precisions": [ + 0.39735084971517076, + 0.15895430720039008, + 0.06991755510347676, + 0.03110743820111788 + ], + "eval_bleu_reference_length": 238279, + "eval_bleu_translation_length": 230489, + "eval_chrf_beta": 2, + "eval_chrf_char_order": 6, + "eval_chrf_score": 35.097739683308546, + "eval_chrf_word_order": 2, + "eval_loss": 2.0169615745544434, + "eval_meteor": 0.3151805622318303, + "eval_runtime": 937.2032, + "eval_samples_per_second": 18.35, + "eval_scarebleu_bp": 0.9869229386704703, + "eval_scarebleu_counts": [ + 104995, + 40630, + 17193, + 7380 + ], + "eval_scarebleu_precisions": [ + 42.434223820878636, + 17.64718657024345, + 8.06948212257465, + 3.765536665510133 + ], + "eval_scarebleu_ref_len": 250687, + "eval_scarebleu_score": 12.121303189280749, + "eval_scarebleu_sys_len": 247430, + "eval_scarebleu_totals": [ + 247430, + 230235, + 213062, + 195988 + ], + "eval_steps_per_second": 0.574, + "eval_ter_num_edits": 154751, + "eval_ter_ref_length": 218369.0, + "eval_ter_score": 70.86674390595735, + "step": 260000 + } + ], + "max_steps": 510600, + "num_train_epochs": 200, + "total_flos": 2.814895884337152e+17, + "trial_name": null, + "trial_params": null +}