diff --git "a/last-checkpoint/trainer_state.json" "b/last-checkpoint/trainer_state.json" new file mode 100644--- /dev/null +++ "b/last-checkpoint/trainer_state.json" @@ -0,0 +1,5666 @@ +{ + "best_metric": 2.768705023404105, + "best_model_checkpoint": "./results/R-facebook-bart-base-full-ft-without-tum-nlp-german-gpt2_easy-prior-pp-no_ls-f135/checkpoint-100", + "epoch": 0.12433944668946223, + "global_step": 100, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0, + "prior_loss": 1707.30078125, + "step": 0, + "translation_loss": 3.63191294670105, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0, + "prior_loss": 39218.515625, + "step": 0, + "translation_loss": 3.708862781524658, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0, + "prior_loss": 988.1674194335938, + "step": 0, + "translation_loss": 3.864363431930542, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0, + "prior_loss": 606.6981811523438, + "step": 0, + "translation_loss": 3.8811421394348145, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0, + "prior_loss": 1395.2628173828125, + "step": 0, + "translation_loss": 4.127743244171143, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0, + "prior_loss": 755.3653564453125, + "step": 0, + "translation_loss": 3.763817548751831, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0, + "prior_loss": 3561.888916015625, + "step": 0, + "translation_loss": 4.2197442054748535, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0, + "prior_loss": 1503.4136962890625, + "step": 0, + "translation_loss": 3.7694497108459473, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "learning_rate": 0.0, + "loss": 3.8709, + "step": 1 + }, + { + "epoch": 0.0, + "prior_loss": 3250.18994140625, + "step": 1, + "translation_loss": 3.739914655685425, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 1696.839111328125, + "step": 1, + "translation_loss": 3.5914244651794434, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 3932.857421875, + "step": 1, + "translation_loss": 3.195557117462158, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 1521.7666015625, + "step": 1, + "translation_loss": 4.022922039031982, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 901.2119140625, + "step": 1, + "translation_loss": 2.8743398189544678, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 953.7800903320312, + "step": 1, + "translation_loss": 4.420579433441162, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 304.9666748046875, + "step": 1, + "translation_loss": 2.8146350383758545, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 145.98255920410156, + "step": 1, + "translation_loss": 3.868675708770752, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 617.2018432617188, + "step": 2, + "translation_loss": 4.05088996887207, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 552.3394165039062, + "step": 2, + "translation_loss": 3.995864152908325, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 2125.571533203125, + "step": 2, + "translation_loss": 4.105653285980225, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 4243.6416015625, + "step": 2, + "translation_loss": 3.1850550174713135, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 1024.8260498046875, + "step": 2, + "translation_loss": 3.3498642444610596, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 537.5435180664062, + "step": 2, + "translation_loss": 4.033816337585449, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 2673.3076171875, + "step": 2, + "translation_loss": 3.5206034183502197, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 3627.128662109375, + "step": 2, + "translation_loss": 3.726022720336914, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 36791.86328125, + "step": 3, + "translation_loss": 3.0330393314361572, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 4279.40185546875, + "step": 3, + "translation_loss": 3.8271069526672363, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 158.74815368652344, + "step": 3, + "translation_loss": 3.806774377822876, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 219.97286987304688, + "step": 3, + "translation_loss": 3.4123730659484863, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 396.3480224609375, + "step": 3, + "translation_loss": 4.0942888259887695, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 255.7657470703125, + "step": 3, + "translation_loss": 3.473695993423462, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 1741.6966552734375, + "step": 3, + "translation_loss": 4.111321926116943, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 85.11055755615234, + "step": 3, + "translation_loss": 3.2221126556396484, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 243.43527221679688, + "step": 4, + "translation_loss": 4.165782451629639, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 10596.53125, + "step": 4, + "translation_loss": 4.014073371887207, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 618.0264892578125, + "step": 4, + "translation_loss": 3.6812007427215576, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 5413.974609375, + "step": 4, + "translation_loss": 3.3860793113708496, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 942.1473388671875, + "step": 4, + "translation_loss": 2.8515145778656006, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 245.37696838378906, + "step": 4, + "translation_loss": 3.923508644104004, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 269.5154724121094, + "step": 4, + "translation_loss": 3.9102890491485596, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.0, + "prior_loss": 39264.3984375, + "step": 4, + "translation_loss": 4.222975730895996, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 456.783447265625, + "step": 5, + "translation_loss": 3.9132275581359863, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 128.73046875, + "step": 5, + "translation_loss": 3.522397994995117, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 237.13902282714844, + "step": 5, + "translation_loss": 4.574235439300537, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 4196.478515625, + "step": 5, + "translation_loss": 3.601461410522461, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 2197.551025390625, + "step": 5, + "translation_loss": 3.6719412803649902, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 3294.934326171875, + "step": 5, + "translation_loss": 4.042680263519287, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 880.8514404296875, + "step": 5, + "translation_loss": 3.4600703716278076, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 2216.124267578125, + "step": 5, + "translation_loss": 3.4124064445495605, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 623.5685424804688, + "step": 6, + "translation_loss": 3.9444315433502197, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 140.0327606201172, + "step": 6, + "translation_loss": 3.5770418643951416, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 20332.64453125, + "step": 6, + "translation_loss": 3.60186505317688, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 9688.0546875, + "step": 6, + "translation_loss": 3.541936159133911, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 726.2144165039062, + "step": 6, + "translation_loss": 2.7987420558929443, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 893.1005859375, + "step": 6, + "translation_loss": 3.0670199394226074, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 280.3255310058594, + "step": 6, + "translation_loss": 3.5404295921325684, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 11438.3994140625, + "step": 6, + "translation_loss": 4.132778644561768, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 414.7995300292969, + "step": 7, + "translation_loss": 3.0746304988861084, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 155.2140350341797, + "step": 7, + "translation_loss": 3.8657822608947754, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 625.9691162109375, + "step": 7, + "translation_loss": 3.4460067749023438, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 1915.81884765625, + "step": 7, + "translation_loss": 3.3514318466186523, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 912.017822265625, + "step": 7, + "translation_loss": 3.850133180618286, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 24230.845703125, + "step": 7, + "translation_loss": 3.552932024002075, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 876.1869506835938, + "step": 7, + "translation_loss": 3.83473539352417, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 743.6853637695312, + "step": 7, + "translation_loss": 3.2140040397644043, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 1687.4359130859375, + "step": 8, + "translation_loss": 4.091519832611084, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 14299.7861328125, + "step": 8, + "translation_loss": 3.3910322189331055, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 2929.21875, + "step": 8, + "translation_loss": 3.72690749168396, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 1660.87158203125, + "step": 8, + "translation_loss": 3.1896567344665527, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 18120.87890625, + "step": 8, + "translation_loss": 3.4352285861968994, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 1275.152099609375, + "step": 8, + "translation_loss": 3.496962070465088, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 546.5042724609375, + "step": 8, + "translation_loss": 3.543036699295044, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 2017.75, + "step": 8, + "translation_loss": 4.179780960083008, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 636.9287719726562, + "step": 9, + "translation_loss": 3.3264081478118896, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 599.991455078125, + "step": 9, + "translation_loss": 4.529600620269775, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 10448.0478515625, + "step": 9, + "translation_loss": 3.546550989151001, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 159.4227294921875, + "step": 9, + "translation_loss": 3.29679012298584, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 1122.3275146484375, + "step": 9, + "translation_loss": 3.372741460800171, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 38187.1328125, + "step": 9, + "translation_loss": 3.9311227798461914, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 760.148193359375, + "step": 9, + "translation_loss": 2.8504717350006104, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 572.2559814453125, + "step": 9, + "translation_loss": 2.824134588241577, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 512.7816162109375, + "step": 10, + "translation_loss": 2.9327893257141113, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 1464.39013671875, + "step": 10, + "translation_loss": 2.926840305328369, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 340.7959899902344, + "step": 10, + "translation_loss": 3.5755770206451416, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 3358.572265625, + "step": 10, + "translation_loss": 3.696779489517212, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 1466.9263916015625, + "step": 10, + "translation_loss": 4.0555830001831055, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 235.8191375732422, + "step": 10, + "translation_loss": 3.148876428604126, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 506.189697265625, + "step": 10, + "translation_loss": 3.3211753368377686, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 2254.88818359375, + "step": 10, + "translation_loss": 3.4944634437561035, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 3171.561279296875, + "step": 11, + "translation_loss": 2.8429431915283203, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 371.9290466308594, + "step": 11, + "translation_loss": 3.5747230052948, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 17512.39453125, + "step": 11, + "translation_loss": 3.2137279510498047, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 171.3442840576172, + "step": 11, + "translation_loss": 3.13053297996521, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 2426.077880859375, + "step": 11, + "translation_loss": 4.03982400894165, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 119.39710998535156, + "step": 11, + "translation_loss": 3.3579041957855225, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 352.8841552734375, + "step": 11, + "translation_loss": 4.344560146331787, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 9906.693359375, + "step": 11, + "translation_loss": 3.40232515335083, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 314.6402893066406, + "step": 12, + "translation_loss": 2.91984224319458, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 191.6884307861328, + "step": 12, + "translation_loss": 3.214494228363037, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 5624.56103515625, + "step": 12, + "translation_loss": 3.323265314102173, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 211.53744506835938, + "step": 12, + "translation_loss": 3.1089541912078857, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 7255.69921875, + "step": 12, + "translation_loss": 3.474808692932129, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 641.6351318359375, + "step": 12, + "translation_loss": 3.4104371070861816, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 623.0465698242188, + "step": 12, + "translation_loss": 2.561013698577881, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.01, + "prior_loss": 2107.768798828125, + "step": 12, + "translation_loss": 3.0953125953674316, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 560.3124389648438, + "step": 13, + "translation_loss": 3.786608934402466, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 1204.8353271484375, + "step": 13, + "translation_loss": 3.914158344268799, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 8330.6328125, + "step": 13, + "translation_loss": 2.6290175914764404, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 1487.8218994140625, + "step": 13, + "translation_loss": 3.2710320949554443, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 19958.474609375, + "step": 13, + "translation_loss": 4.0989484786987305, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 9607.5478515625, + "step": 13, + "translation_loss": 3.7195749282836914, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 838.7387084960938, + "step": 13, + "translation_loss": 3.2072200775146484, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 124.06493377685547, + "step": 13, + "translation_loss": 3.525177001953125, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 21604.84375, + "step": 14, + "translation_loss": 3.0134358406066895, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 731.5599365234375, + "step": 14, + "translation_loss": 2.838172435760498, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 448.841552734375, + "step": 14, + "translation_loss": 3.3223793506622314, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 2801.52490234375, + "step": 14, + "translation_loss": 3.331775665283203, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 11140.0087890625, + "step": 14, + "translation_loss": 2.941495656967163, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 159.2047882080078, + "step": 14, + "translation_loss": 3.763871431350708, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 166874.734375, + "step": 14, + "translation_loss": 3.0975606441497803, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 8503.7265625, + "step": 14, + "translation_loss": 3.5133767127990723, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 728.7926025390625, + "step": 15, + "translation_loss": 3.7376301288604736, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 2872.240478515625, + "step": 15, + "translation_loss": 3.4173362255096436, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 499.7095031738281, + "step": 15, + "translation_loss": 3.314438819885254, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 1308.433837890625, + "step": 15, + "translation_loss": 2.7751779556274414, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 998.3282470703125, + "step": 15, + "translation_loss": 2.8526408672332764, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 3156.152099609375, + "step": 15, + "translation_loss": 3.1299033164978027, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 1018.6434326171875, + "step": 15, + "translation_loss": 3.4771840572357178, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 3111.285888671875, + "step": 15, + "translation_loss": 3.353817939758301, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 62854.953125, + "step": 16, + "translation_loss": 2.5362977981567383, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 393.0377502441406, + "step": 16, + "translation_loss": 2.861375570297241, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 68.56597900390625, + "step": 16, + "translation_loss": 3.6941072940826416, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 1348.2684326171875, + "step": 16, + "translation_loss": 2.8689870834350586, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 428.3122863769531, + "step": 16, + "translation_loss": 3.370063543319702, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 239.41685485839844, + "step": 16, + "translation_loss": 3.191861391067505, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 3063.4091796875, + "step": 16, + "translation_loss": 3.80499529838562, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 966.6638793945312, + "step": 16, + "translation_loss": 2.4742653369903564, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 589.40087890625, + "step": 17, + "translation_loss": 3.6053080558776855, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 335.44940185546875, + "step": 17, + "translation_loss": 3.3395421504974365, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 5277.89892578125, + "step": 17, + "translation_loss": 2.896674156188965, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 83549.59375, + "step": 17, + "translation_loss": 2.8455190658569336, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 490.16461181640625, + "step": 17, + "translation_loss": 3.152902364730835, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 1290.6361083984375, + "step": 17, + "translation_loss": 3.2821733951568604, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 300.3488464355469, + "step": 17, + "translation_loss": 2.860276222229004, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 442.4078674316406, + "step": 17, + "translation_loss": 3.2156078815460205, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 53.628028869628906, + "step": 18, + "translation_loss": 3.4492146968841553, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 683.1463623046875, + "step": 18, + "translation_loss": 3.0299715995788574, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 367.95684814453125, + "step": 18, + "translation_loss": 2.9418530464172363, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 523.6568603515625, + "step": 18, + "translation_loss": 3.0766870975494385, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 163.60134887695312, + "step": 18, + "translation_loss": 2.7210586071014404, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 15093.619140625, + "step": 18, + "translation_loss": 2.8328356742858887, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 9750.3515625, + "step": 18, + "translation_loss": 2.5910115242004395, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 600.3460693359375, + "step": 18, + "translation_loss": 3.4899864196777344, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 348.6884765625, + "step": 19, + "translation_loss": 2.680044174194336, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 472.7681579589844, + "step": 19, + "translation_loss": 3.3350231647491455, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 231.25038146972656, + "step": 19, + "translation_loss": 2.9491028785705566, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 479.041748046875, + "step": 19, + "translation_loss": 2.8961615562438965, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 428.0375061035156, + "step": 19, + "translation_loss": 3.234879970550537, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 4931.5068359375, + "step": 19, + "translation_loss": 3.0451297760009766, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 598.397705078125, + "step": 19, + "translation_loss": 2.787959575653076, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 2955.88916015625, + "step": 19, + "translation_loss": 2.7146799564361572, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "learning_rate": 9.5e-06, + "loss": 3.414, + "step": 20 + }, + { + "epoch": 0.02, + "prior_loss": 1020.8685913085938, + "step": 20, + "translation_loss": 2.9947245121002197, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 981.5440063476562, + "step": 20, + "translation_loss": 2.5459489822387695, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 365.3856201171875, + "step": 20, + "translation_loss": 3.35145902633667, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 2277.2412109375, + "step": 20, + "translation_loss": 2.841393232345581, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 1254.790283203125, + "step": 20, + "translation_loss": 3.753214120864868, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 299.60302734375, + "step": 20, + "translation_loss": 2.9088194370269775, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 7595.05126953125, + "step": 20, + "translation_loss": 2.800506114959717, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.02, + "prior_loss": 149.99600219726562, + "step": 20, + "translation_loss": 2.98956036567688, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 513.5338134765625, + "step": 21, + "translation_loss": 2.5187432765960693, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 6942.28662109375, + "step": 21, + "translation_loss": 2.931713581085205, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 81.0897445678711, + "step": 21, + "translation_loss": 2.4850518703460693, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 8532.556640625, + "step": 21, + "translation_loss": 3.012676477432251, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 1230.4041748046875, + "step": 21, + "translation_loss": 3.271296262741089, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 1129.050048828125, + "step": 21, + "translation_loss": 2.744448184967041, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 187.0287322998047, + "step": 21, + "translation_loss": 3.4022562503814697, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 203.87066650390625, + "step": 21, + "translation_loss": 2.5080387592315674, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 5926.03662109375, + "step": 22, + "translation_loss": 3.0145840644836426, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 104.25637817382812, + "step": 22, + "translation_loss": 2.995145320892334, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 1443.20556640625, + "step": 22, + "translation_loss": 3.0057859420776367, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 598.8372802734375, + "step": 22, + "translation_loss": 3.2452216148376465, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 459.9767761230469, + "step": 22, + "translation_loss": 2.880857229232788, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 219.27894592285156, + "step": 22, + "translation_loss": 2.8758561611175537, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 1517.6368408203125, + "step": 22, + "translation_loss": 3.287381172180176, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 3982.54638671875, + "step": 22, + "translation_loss": 2.970747470855713, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 305.5115966796875, + "step": 23, + "translation_loss": 2.8778929710388184, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 2409.3466796875, + "step": 23, + "translation_loss": 2.9992287158966064, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 332.14227294921875, + "step": 23, + "translation_loss": 3.041053295135498, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 6028.98681640625, + "step": 23, + "translation_loss": 2.8171188831329346, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 2901.39697265625, + "step": 23, + "translation_loss": 2.2492873668670654, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 1732.68994140625, + "step": 23, + "translation_loss": 3.1273019313812256, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 6598.60107421875, + "step": 23, + "translation_loss": 2.1542067527770996, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 1684.2982177734375, + "step": 23, + "translation_loss": 2.9402990341186523, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 1055.8057861328125, + "step": 24, + "translation_loss": 2.856578826904297, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 1307.119873046875, + "step": 24, + "translation_loss": 2.9279775619506836, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 80.20691680908203, + "step": 24, + "translation_loss": 2.915640115737915, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 14956.478515625, + "step": 24, + "translation_loss": 2.6688430309295654, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 3289.697265625, + "step": 24, + "translation_loss": 2.7132956981658936, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 258.2283020019531, + "step": 24, + "translation_loss": 3.1804656982421875, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 238.52711486816406, + "step": 24, + "translation_loss": 3.615835428237915, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 109.30924987792969, + "step": 24, + "translation_loss": 2.577155113220215, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 375.9421691894531, + "step": 25, + "translation_loss": 2.767167806625366, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 2038.2236328125, + "step": 25, + "translation_loss": 1.9460651874542236, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 362.8846130371094, + "step": 25, + "translation_loss": 2.741689920425415, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 183.02615356445312, + "step": 25, + "translation_loss": 3.0913331508636475, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 151.22125244140625, + "step": 25, + "translation_loss": 3.089398145675659, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 322.2772216796875, + "step": 25, + "translation_loss": 2.7948291301727295, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 28623.869140625, + "step": 25, + "translation_loss": 2.928835153579712, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 379.0719299316406, + "step": 25, + "translation_loss": 3.4467620849609375, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 28466.27734375, + "step": 26, + "translation_loss": 4.136862277984619, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 40781.3125, + "step": 26, + "translation_loss": 2.9517483711242676, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 366.0095520019531, + "step": 26, + "translation_loss": 2.70383882522583, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 1090.8385009765625, + "step": 26, + "translation_loss": 2.837846279144287, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 148.4166259765625, + "step": 26, + "translation_loss": 2.7511632442474365, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 12083.1669921875, + "step": 26, + "translation_loss": 2.484536647796631, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 1199.8822021484375, + "step": 26, + "translation_loss": 2.544184446334839, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 355.1436462402344, + "step": 26, + "translation_loss": 3.5038654804229736, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 3520.025634765625, + "step": 27, + "translation_loss": 3.265793800354004, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 6067.78369140625, + "step": 27, + "translation_loss": 2.3993661403656006, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 328.1143493652344, + "step": 27, + "translation_loss": 2.7988173961639404, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 322.1874694824219, + "step": 27, + "translation_loss": 2.740968704223633, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 8035.541015625, + "step": 27, + "translation_loss": 3.0941414833068848, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 5241.033203125, + "step": 27, + "translation_loss": 3.169420003890991, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 43852.6328125, + "step": 27, + "translation_loss": 2.577392578125, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 199.79193115234375, + "step": 27, + "translation_loss": 2.739144802093506, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 645.7705078125, + "step": 28, + "translation_loss": 2.480553150177002, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 329.97723388671875, + "step": 28, + "translation_loss": 2.5233798027038574, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 500.57281494140625, + "step": 28, + "translation_loss": 2.6270840167999268, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 301.4358215332031, + "step": 28, + "translation_loss": 3.2896862030029297, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 693.203857421875, + "step": 28, + "translation_loss": 2.257539987564087, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 13178815.0, + "step": 28, + "translation_loss": 3.0022170543670654, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 656.52978515625, + "step": 28, + "translation_loss": 2.183096408843994, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.03, + "prior_loss": 433.05621337890625, + "step": 28, + "translation_loss": 2.9882094860076904, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 652.662109375, + "step": 29, + "translation_loss": 2.7720041275024414, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 8348.12890625, + "step": 29, + "translation_loss": 2.1925418376922607, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 805.088623046875, + "step": 29, + "translation_loss": 2.4491355419158936, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 7292.2021484375, + "step": 29, + "translation_loss": 2.477199077606201, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 13745.92578125, + "step": 29, + "translation_loss": 2.8613715171813965, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 57543.56640625, + "step": 29, + "translation_loss": 3.0750174522399902, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 1479.178955078125, + "step": 29, + "translation_loss": 3.017627239227295, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 16355.853515625, + "step": 29, + "translation_loss": 2.003383159637451, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 12245006336.0, + "step": 30, + "translation_loss": 2.492370367050171, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 40915247104.0, + "step": 30, + "translation_loss": 2.625476837158203, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 3855.12353515625, + "step": 30, + "translation_loss": 3.125150442123413, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 193.48391723632812, + "step": 30, + "translation_loss": 2.9260799884796143, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 57.985862731933594, + "step": 30, + "translation_loss": 2.5323326587677, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 14548.0986328125, + "step": 30, + "translation_loss": 2.7247796058654785, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 27725.115234375, + "step": 30, + "translation_loss": 2.8669357299804688, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 25917.0625, + "step": 30, + "translation_loss": 2.3437907695770264, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 525.4873657226562, + "step": 31, + "translation_loss": 2.3366894721984863, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 26584530944.0, + "step": 31, + "translation_loss": 3.3513712882995605, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 9877.1943359375, + "step": 31, + "translation_loss": 5.080294609069824, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 16176393216.0, + "step": 31, + "translation_loss": 2.747060537338257, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 9965.2236328125, + "step": 31, + "translation_loss": 3.3197243213653564, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 82321629184.0, + "step": 31, + "translation_loss": 2.7262234687805176, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 346.38153076171875, + "step": 31, + "translation_loss": 2.492765426635742, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 15604.69140625, + "step": 31, + "translation_loss": 3.1473803520202637, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 139215.9375, + "step": 32, + "translation_loss": 2.6604092121124268, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 55725852.0, + "step": 32, + "translation_loss": 2.8472397327423096, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 17364074496.0, + "step": 32, + "translation_loss": 2.7783472537994385, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 1002.6069946289062, + "step": 32, + "translation_loss": 2.5269994735717773, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 15374271488.0, + "step": 32, + "translation_loss": 2.7640295028686523, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 1337.924072265625, + "step": 32, + "translation_loss": 2.4041330814361572, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 22898378752.0, + "step": 32, + "translation_loss": 2.287308931350708, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 36251529216.0, + "step": 32, + "translation_loss": 3.8761184215545654, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 5636.20751953125, + "step": 33, + "translation_loss": 3.0656135082244873, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 14812418048.0, + "step": 33, + "translation_loss": 2.8658864498138428, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 358.64459228515625, + "step": 33, + "translation_loss": 2.9616079330444336, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 47690739712.0, + "step": 33, + "translation_loss": 2.677978277206421, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 19993.794921875, + "step": 33, + "translation_loss": 2.039472818374634, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 13169613824.0, + "step": 33, + "translation_loss": 3.08607816696167, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 13662558208.0, + "step": 33, + "translation_loss": 2.810093402862549, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 1880.5291748046875, + "step": 33, + "translation_loss": 2.7712759971618652, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 2421.1396484375, + "step": 34, + "translation_loss": 2.9306511878967285, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 1956.8223876953125, + "step": 34, + "translation_loss": 2.625603199005127, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 0, + "step": 34, + "translation_loss": 2.562358856201172, + "weighted_prior_loss": 0 + }, + { + "epoch": 0.04, + "prior_loss": 16129163264.0, + "step": 34, + "translation_loss": 3.0476839542388916, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 52701319168.0, + "step": 34, + "translation_loss": 2.2823283672332764, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 1091.2962646484375, + "step": 34, + "translation_loss": 2.118896722793579, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 737.7269897460938, + "step": 34, + "translation_loss": 3.3296959400177, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 13673430016.0, + "step": 34, + "translation_loss": 2.213545083999634, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 10710700032.0, + "step": 35, + "translation_loss": 3.694119691848755, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 14446014464.0, + "step": 35, + "translation_loss": 2.295588731765747, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 30189346.0, + "step": 35, + "translation_loss": 3.5995895862579346, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 6051.93701171875, + "step": 35, + "translation_loss": 2.7716684341430664, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 0, + "step": 35, + "translation_loss": 2.54858136177063, + "weighted_prior_loss": 0 + }, + { + "epoch": 0.04, + "prior_loss": 35988770816.0, + "step": 35, + "translation_loss": 1.8845468759536743, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 47525388288.0, + "step": 35, + "translation_loss": 3.323378324508667, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 12017743872.0, + "step": 35, + "translation_loss": 2.659670352935791, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 0, + "step": 36, + "translation_loss": 2.799809455871582, + "weighted_prior_loss": 0 + }, + { + "epoch": 0.04, + "prior_loss": 25985150976.0, + "step": 36, + "translation_loss": 2.7681009769439697, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 523.900146484375, + "step": 36, + "translation_loss": 2.3618335723876953, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 253.7380828857422, + "step": 36, + "translation_loss": 3.235590696334839, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 47242231808.0, + "step": 36, + "translation_loss": 2.0832972526550293, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.04, + "prior_loss": 0, + "step": 36, + "translation_loss": 2.4478816986083984, + "weighted_prior_loss": 0 + }, + { + "epoch": 0.04, + "prior_loss": 0, + "step": 36, + "translation_loss": 1.8477418422698975, + "weighted_prior_loss": 0 + }, + { + "epoch": 0.04, + "prior_loss": 38111465472.0, + "step": 36, + "translation_loss": 2.8331663608551025, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 17751996416.0, + "step": 37, + "translation_loss": 1.9484083652496338, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 3915.66845703125, + "step": 37, + "translation_loss": 2.350802183151245, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 22008727552.0, + "step": 37, + "translation_loss": 3.0715744495391846, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 5709.49072265625, + "step": 37, + "translation_loss": 2.822971820831299, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 3579.5966796875, + "step": 37, + "translation_loss": 2.615558624267578, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 1263.0809326171875, + "step": 37, + "translation_loss": 2.9781241416931152, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 34523230208.0, + "step": 37, + "translation_loss": 1.9737215042114258, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 22843152384.0, + "step": 37, + "translation_loss": 3.0372390747070312, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 14194191360.0, + "step": 38, + "translation_loss": 2.690642833709717, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 2409.46484375, + "step": 38, + "translation_loss": 2.713493824005127, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 24129800192.0, + "step": 38, + "translation_loss": 2.5938901901245117, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 2921.53271484375, + "step": 38, + "translation_loss": 2.6513009071350098, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 2638.1806640625, + "step": 38, + "translation_loss": 2.399062156677246, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 4398.1484375, + "step": 38, + "translation_loss": 2.760399103164673, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 151.13351440429688, + "step": 38, + "translation_loss": 2.44891619682312, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 18875.84375, + "step": 38, + "translation_loss": 2.5314810276031494, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 4661.501953125, + "step": 39, + "translation_loss": 3.1465070247650146, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 14345524.0, + "step": 39, + "translation_loss": 2.1863112449645996, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 1539.2913818359375, + "step": 39, + "translation_loss": 1.9646087884902954, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 2691.621826171875, + "step": 39, + "translation_loss": 2.46647572517395, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 314.5055847167969, + "step": 39, + "translation_loss": 2.122422695159912, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 868.9664306640625, + "step": 39, + "translation_loss": 3.3733091354370117, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 6626.126953125, + "step": 39, + "translation_loss": 3.0756776332855225, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 9165.3564453125, + "step": 39, + "translation_loss": 2.182021379470825, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "learning_rate": 1.9500000000000003e-05, + "loss": 2.7896, + "step": 40 + }, + { + "epoch": 0.05, + "prior_loss": 76.98571014404297, + "step": 40, + "translation_loss": 2.6163418292999268, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 985.2423095703125, + "step": 40, + "translation_loss": 2.470874309539795, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 2903.302734375, + "step": 40, + "translation_loss": 2.84169340133667, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 439.15093994140625, + "step": 40, + "translation_loss": 2.4668946266174316, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 172.56846618652344, + "step": 40, + "translation_loss": 2.0735769271850586, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 35898208256.0, + "step": 40, + "translation_loss": 1.6733388900756836, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 2401.779296875, + "step": 40, + "translation_loss": 2.9737958908081055, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 390.3286437988281, + "step": 40, + "translation_loss": 2.832522392272949, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 4907.1064453125, + "step": 41, + "translation_loss": 2.9739532470703125, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 1897.729248046875, + "step": 41, + "translation_loss": 2.1625614166259766, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 428.0180969238281, + "step": 41, + "translation_loss": 3.2574875354766846, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 457.0503234863281, + "step": 41, + "translation_loss": 2.99595308303833, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 12948.0, + "step": 41, + "translation_loss": 3.1333811283111572, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 1127.4000244140625, + "step": 41, + "translation_loss": 2.446340560913086, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 663.6466064453125, + "step": 41, + "translation_loss": 2.691795825958252, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 5347.06396484375, + "step": 41, + "translation_loss": 2.348083734512329, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 234895.203125, + "step": 42, + "translation_loss": 2.3153810501098633, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 7594.95068359375, + "step": 42, + "translation_loss": 2.605010509490967, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 226.57870483398438, + "step": 42, + "translation_loss": 1.9035507440567017, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 519.949462890625, + "step": 42, + "translation_loss": 2.7312638759613037, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 6483.45654296875, + "step": 42, + "translation_loss": 2.98213791847229, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 564.8464965820312, + "step": 42, + "translation_loss": 2.448457717895508, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 1918074.125, + "step": 42, + "translation_loss": 1.7959768772125244, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 175.01817321777344, + "step": 42, + "translation_loss": 2.630247116088867, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 3255.54736328125, + "step": 43, + "translation_loss": 2.3548145294189453, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 8582.19140625, + "step": 43, + "translation_loss": 1.9305567741394043, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 1393.3333740234375, + "step": 43, + "translation_loss": 2.5797741413116455, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 1696.06591796875, + "step": 43, + "translation_loss": 2.5442497730255127, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 270.8102722167969, + "step": 43, + "translation_loss": 3.2501094341278076, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 2494.85205078125, + "step": 43, + "translation_loss": 2.317167282104492, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 1442.7603759765625, + "step": 43, + "translation_loss": 1.5417113304138184, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 475.7865905761719, + "step": 43, + "translation_loss": 2.4731340408325195, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 22286.021484375, + "step": 44, + "translation_loss": 2.96799635887146, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 234.29615783691406, + "step": 44, + "translation_loss": 2.6808528900146484, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 3613.149658203125, + "step": 44, + "translation_loss": 2.2219057083129883, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 9577.12109375, + "step": 44, + "translation_loss": 3.3466384410858154, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 1192.7283935546875, + "step": 44, + "translation_loss": 3.4438979625701904, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 10000.802734375, + "step": 44, + "translation_loss": 2.8795738220214844, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 45959820.0, + "step": 44, + "translation_loss": 2.5401434898376465, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.05, + "prior_loss": 820.991455078125, + "step": 44, + "translation_loss": 2.4504175186157227, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 121.32227325439453, + "step": 45, + "translation_loss": 2.8191728591918945, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 22358.189453125, + "step": 45, + "translation_loss": 2.108431100845337, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 65746064.0, + "step": 45, + "translation_loss": 2.197628974914551, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 354.31146240234375, + "step": 45, + "translation_loss": 2.973529100418091, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 202188.0, + "step": 45, + "translation_loss": 2.542868137359619, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 2741.616943359375, + "step": 45, + "translation_loss": 2.9235246181488037, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 949.3787231445312, + "step": 45, + "translation_loss": 2.6596457958221436, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 8397.0283203125, + "step": 45, + "translation_loss": 2.0661890506744385, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1981.2894287109375, + "step": 46, + "translation_loss": 2.732029676437378, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 14846.9658203125, + "step": 46, + "translation_loss": 2.7421414852142334, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1143.88623046875, + "step": 46, + "translation_loss": 2.244983673095703, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 574331.75, + "step": 46, + "translation_loss": 1.5182671546936035, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 14222.6171875, + "step": 46, + "translation_loss": 2.4449033737182617, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 27825472.0, + "step": 46, + "translation_loss": 2.0374045372009277, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 9751.587890625, + "step": 46, + "translation_loss": 2.1189324855804443, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 762.0808715820312, + "step": 46, + "translation_loss": 3.0398406982421875, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 223.2962188720703, + "step": 47, + "translation_loss": 2.288409948348999, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 167.9105987548828, + "step": 47, + "translation_loss": 2.3043253421783447, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 298069.65625, + "step": 47, + "translation_loss": 2.050784111022949, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 9243971.0, + "step": 47, + "translation_loss": 2.5102121829986572, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 113545.875, + "step": 47, + "translation_loss": 2.7656450271606445, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 23854378.0, + "step": 47, + "translation_loss": 2.3364858627319336, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 8095.6611328125, + "step": 47, + "translation_loss": 2.5964560508728027, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 2516574.0, + "step": 47, + "translation_loss": 2.553652286529541, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1587.36328125, + "step": 48, + "translation_loss": 3.7713305950164795, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 280592.21875, + "step": 48, + "translation_loss": 1.9616296291351318, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 10837.490234375, + "step": 48, + "translation_loss": 2.871818780899048, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 498.154052734375, + "step": 48, + "translation_loss": 2.291963577270508, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 460.2354431152344, + "step": 48, + "translation_loss": 2.2709977626800537, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 27024.681640625, + "step": 48, + "translation_loss": 2.0999999046325684, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 50871.16015625, + "step": 48, + "translation_loss": 2.195446729660034, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 4193024.5, + "step": 48, + "translation_loss": 1.969450831413269, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1048.3634033203125, + "step": 49, + "translation_loss": 2.3302605152130127, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 50.07112503051758, + "step": 49, + "translation_loss": 2.6747918128967285, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 8083.83447265625, + "step": 49, + "translation_loss": 2.0269784927368164, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1603.566162109375, + "step": 49, + "translation_loss": 1.9423367977142334, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 7355128.0, + "step": 49, + "translation_loss": 2.770983934402466, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 13955.748046875, + "step": 49, + "translation_loss": 2.624398946762085, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 31127108.0, + "step": 49, + "translation_loss": 2.556025743484497, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 103483.2421875, + "step": 49, + "translation_loss": 2.349360466003418, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 25704.142578125, + "step": 50, + "translation_loss": 3.076753854751587, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 5162.2978515625, + "step": 50, + "translation_loss": 2.448409080505371, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 284410.03125, + "step": 50, + "translation_loss": 2.621201515197754, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1343.4205322265625, + "step": 50, + "translation_loss": 2.534526824951172, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 682190.6875, + "step": 50, + "translation_loss": 2.9573075771331787, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 96847.0625, + "step": 50, + "translation_loss": 2.31215763092041, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1285467.875, + "step": 50, + "translation_loss": 2.9680416584014893, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 197915.5625, + "step": 50, + "translation_loss": 3.4877026081085205, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 13308.048828125, + "step": 51, + "translation_loss": 2.826706647872925, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1114650.375, + "step": 51, + "translation_loss": 3.4060773849487305, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 2143.52099609375, + "step": 51, + "translation_loss": 3.0055246353149414, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 423.56622314453125, + "step": 51, + "translation_loss": 3.302173614501953, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 170.89102172851562, + "step": 51, + "translation_loss": 2.8849403858184814, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 2299.9013671875, + "step": 51, + "translation_loss": 3.333608388900757, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 368.6335144042969, + "step": 51, + "translation_loss": 3.1823103427886963, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 5171.28564453125, + "step": 51, + "translation_loss": 2.2719979286193848, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1076.5777587890625, + "step": 52, + "translation_loss": 2.6052849292755127, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 338.74310302734375, + "step": 52, + "translation_loss": 2.2007763385772705, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 508.402587890625, + "step": 52, + "translation_loss": 2.7329719066619873, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 2741.454833984375, + "step": 52, + "translation_loss": 3.0290117263793945, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 402162.15625, + "step": 52, + "translation_loss": 2.684215784072876, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1598.4033203125, + "step": 52, + "translation_loss": 3.162764072418213, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 1018.390869140625, + "step": 52, + "translation_loss": 3.168086528778076, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.06, + "prior_loss": 2406.908447265625, + "step": 52, + "translation_loss": 2.38944149017334, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 105452.3359375, + "step": 53, + "translation_loss": 2.4552831649780273, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1295.001220703125, + "step": 53, + "translation_loss": 2.982226848602295, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 939.3258666992188, + "step": 53, + "translation_loss": 2.8451178073883057, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 2445.1640625, + "step": 53, + "translation_loss": 2.8071141242980957, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 14559.3125, + "step": 53, + "translation_loss": 3.623149871826172, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 319.066162109375, + "step": 53, + "translation_loss": 3.0006134510040283, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1379.8277587890625, + "step": 53, + "translation_loss": 2.8986988067626953, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 10742.4921875, + "step": 53, + "translation_loss": 2.7171807289123535, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1333.9495849609375, + "step": 54, + "translation_loss": 2.9156908988952637, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 360.90771484375, + "step": 54, + "translation_loss": 2.562307596206665, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 864.2555541992188, + "step": 54, + "translation_loss": 3.8982090950012207, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 4670.05419921875, + "step": 54, + "translation_loss": 2.800447940826416, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 19635.708984375, + "step": 54, + "translation_loss": 3.1964821815490723, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 29674.1015625, + "step": 54, + "translation_loss": 2.597818374633789, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1672.700927734375, + "step": 54, + "translation_loss": 3.0512094497680664, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 425.2651672363281, + "step": 54, + "translation_loss": 3.2743723392486572, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 327.1317138671875, + "step": 55, + "translation_loss": 2.7382936477661133, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 775.9862060546875, + "step": 55, + "translation_loss": 2.853137493133545, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1286.1187744140625, + "step": 55, + "translation_loss": 2.961862325668335, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 22289.974609375, + "step": 55, + "translation_loss": 3.234513521194458, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 3523.508544921875, + "step": 55, + "translation_loss": 3.1312496662139893, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 15226.2099609375, + "step": 55, + "translation_loss": 3.188460350036621, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1063.158447265625, + "step": 55, + "translation_loss": 2.9478611946105957, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1843.249267578125, + "step": 55, + "translation_loss": 2.363640069961548, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1734.0313720703125, + "step": 56, + "translation_loss": 2.3438127040863037, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 3470.052734375, + "step": 56, + "translation_loss": 2.893730640411377, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 396.44708251953125, + "step": 56, + "translation_loss": 2.3154115676879883, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1427.71435546875, + "step": 56, + "translation_loss": 2.501102924346924, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 2979.94482421875, + "step": 56, + "translation_loss": 2.9242613315582275, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1899.927490234375, + "step": 56, + "translation_loss": 2.5775182247161865, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 4155.44677734375, + "step": 56, + "translation_loss": 2.9709055423736572, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 511.8208312988281, + "step": 56, + "translation_loss": 3.238539695739746, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 6326.81982421875, + "step": 57, + "translation_loss": 2.5065226554870605, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 420.17242431640625, + "step": 57, + "translation_loss": 2.7858145236968994, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1938.2623291015625, + "step": 57, + "translation_loss": 2.0948009490966797, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 827.8141479492188, + "step": 57, + "translation_loss": 2.103266954421997, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 3891.8232421875, + "step": 57, + "translation_loss": 3.138779878616333, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 38623.48828125, + "step": 57, + "translation_loss": 1.8779627084732056, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 268.7166442871094, + "step": 57, + "translation_loss": 3.1711933612823486, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 141.6114959716797, + "step": 57, + "translation_loss": 2.6696200370788574, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 2868.2509765625, + "step": 58, + "translation_loss": 2.3951127529144287, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 964.9115600585938, + "step": 58, + "translation_loss": 3.463649034500122, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 66155.0390625, + "step": 58, + "translation_loss": 2.0380427837371826, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 530.3189086914062, + "step": 58, + "translation_loss": 2.6590616703033447, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 6231.04296875, + "step": 58, + "translation_loss": 2.750983715057373, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 2858.968505859375, + "step": 58, + "translation_loss": 1.880813717842102, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1050.8629150390625, + "step": 58, + "translation_loss": 2.5398638248443604, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1887.497802734375, + "step": 58, + "translation_loss": 3.0179660320281982, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1121.892578125, + "step": 59, + "translation_loss": 2.681673526763916, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 4379.73583984375, + "step": 59, + "translation_loss": 2.9715397357940674, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1801.1446533203125, + "step": 59, + "translation_loss": 2.6668550968170166, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 785.70556640625, + "step": 59, + "translation_loss": 3.1077988147735596, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1406.0972900390625, + "step": 59, + "translation_loss": 3.107808828353882, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 402.9769592285156, + "step": 59, + "translation_loss": 3.033113718032837, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 456.53369140625, + "step": 59, + "translation_loss": 2.247234344482422, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 3509.835205078125, + "step": 59, + "translation_loss": 2.172299861907959, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "learning_rate": 2.95e-05, + "loss": 2.6541, + "step": 60 + }, + { + "epoch": 0.07, + "prior_loss": 1488.8494873046875, + "step": 60, + "translation_loss": 1.9694535732269287, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 3986.6044921875, + "step": 60, + "translation_loss": 2.9307076930999756, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1812.448974609375, + "step": 60, + "translation_loss": 2.1896629333496094, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 3012.5810546875, + "step": 60, + "translation_loss": 2.2703053951263428, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 824.6669921875, + "step": 60, + "translation_loss": 2.4586219787597656, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 973.5126953125, + "step": 60, + "translation_loss": 2.4691367149353027, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 13692.4775390625, + "step": 60, + "translation_loss": 2.7337493896484375, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.07, + "prior_loss": 1012.3287353515625, + "step": 60, + "translation_loss": 2.5207948684692383, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 3078.262939453125, + "step": 61, + "translation_loss": 2.9145758152008057, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 11592.6513671875, + "step": 61, + "translation_loss": 2.5432181358337402, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1083.3583984375, + "step": 61, + "translation_loss": 2.3098082542419434, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 330.4187316894531, + "step": 61, + "translation_loss": 2.444812059402466, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 2116.526611328125, + "step": 61, + "translation_loss": 3.2120442390441895, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 922.4248657226562, + "step": 61, + "translation_loss": 2.9775850772857666, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1302.0716552734375, + "step": 61, + "translation_loss": 2.4831020832061768, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 8592.5185546875, + "step": 61, + "translation_loss": 3.23799467086792, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 25193.76171875, + "step": 62, + "translation_loss": 2.580779790878296, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 526.3593139648438, + "step": 62, + "translation_loss": 3.043778657913208, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 759.1275024414062, + "step": 62, + "translation_loss": 3.5782365798950195, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 423.222412109375, + "step": 62, + "translation_loss": 2.426790714263916, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 556.0695190429688, + "step": 62, + "translation_loss": 2.2685203552246094, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 10489.3505859375, + "step": 62, + "translation_loss": 2.372356653213501, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 250.6095733642578, + "step": 62, + "translation_loss": 3.356727123260498, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 20675.30078125, + "step": 62, + "translation_loss": 2.5946810245513916, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 21586.7421875, + "step": 63, + "translation_loss": 2.4179224967956543, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 2204.508544921875, + "step": 63, + "translation_loss": 3.8794829845428467, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 149.90806579589844, + "step": 63, + "translation_loss": 2.4135215282440186, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 3129.796630859375, + "step": 63, + "translation_loss": 2.2095530033111572, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 4266.69140625, + "step": 63, + "translation_loss": 2.6105570793151855, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1177.2962646484375, + "step": 63, + "translation_loss": 2.5985214710235596, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1030.196533203125, + "step": 63, + "translation_loss": 3.161301612854004, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 30405.509765625, + "step": 63, + "translation_loss": 2.9744057655334473, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 866.0244750976562, + "step": 64, + "translation_loss": 2.5853524208068848, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 3106.648681640625, + "step": 64, + "translation_loss": 2.972160577774048, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 315.9964904785156, + "step": 64, + "translation_loss": 1.8948419094085693, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 454.6532287597656, + "step": 64, + "translation_loss": 2.8570330142974854, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 17184.99609375, + "step": 64, + "translation_loss": 2.7472081184387207, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 692.9688720703125, + "step": 64, + "translation_loss": 2.0155811309814453, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1198.6488037109375, + "step": 64, + "translation_loss": 2.6688177585601807, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 2907.89013671875, + "step": 64, + "translation_loss": 3.171980142593384, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1548.4595947265625, + "step": 65, + "translation_loss": 3.20558500289917, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1243.0909423828125, + "step": 65, + "translation_loss": 2.559492349624634, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 4188.8935546875, + "step": 65, + "translation_loss": 1.9733586311340332, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1036.2816162109375, + "step": 65, + "translation_loss": 2.6448774337768555, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 286.09661865234375, + "step": 65, + "translation_loss": 2.681535005569458, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 2723.026123046875, + "step": 65, + "translation_loss": 2.304877758026123, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 2118.90283203125, + "step": 65, + "translation_loss": 2.351500988006592, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 484.2646179199219, + "step": 65, + "translation_loss": 2.2114596366882324, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 3661.3681640625, + "step": 66, + "translation_loss": 2.5295660495758057, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 3713.09033203125, + "step": 66, + "translation_loss": 2.9004740715026855, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 247.28192138671875, + "step": 66, + "translation_loss": 2.7497072219848633, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 8454.658203125, + "step": 66, + "translation_loss": 3.553863525390625, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1585.9168701171875, + "step": 66, + "translation_loss": 2.6737060546875, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 111064.515625, + "step": 66, + "translation_loss": 2.418370008468628, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 461.54791259765625, + "step": 66, + "translation_loss": 2.4838836193084717, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1431.2822265625, + "step": 66, + "translation_loss": 2.623168706893921, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 2453.043212890625, + "step": 67, + "translation_loss": 2.00156307220459, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 338279.71875, + "step": 67, + "translation_loss": 2.6246883869171143, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 702037.0625, + "step": 67, + "translation_loss": 3.9080350399017334, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 8693.6630859375, + "step": 67, + "translation_loss": 3.2071261405944824, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 17769.779296875, + "step": 67, + "translation_loss": 2.5544848442077637, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1912.175537109375, + "step": 67, + "translation_loss": 2.998584270477295, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 8240.6875, + "step": 67, + "translation_loss": 1.921301245689392, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 150.49757385253906, + "step": 67, + "translation_loss": 2.665179491043091, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 7623.01806640625, + "step": 68, + "translation_loss": 3.623863935470581, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 10379.8486328125, + "step": 68, + "translation_loss": 2.894747734069824, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1097.06884765625, + "step": 68, + "translation_loss": 2.398926258087158, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 1632.1011962890625, + "step": 68, + "translation_loss": 2.5676932334899902, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 331.02349853515625, + "step": 68, + "translation_loss": 2.236046075820923, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 354.36737060546875, + "step": 68, + "translation_loss": 2.3708512783050537, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 574.2796630859375, + "step": 68, + "translation_loss": 3.296247720718384, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.08, + "prior_loss": 2795.04541015625, + "step": 68, + "translation_loss": 2.9749019145965576, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 11074.26171875, + "step": 69, + "translation_loss": 2.5086441040039062, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 30702.28125, + "step": 69, + "translation_loss": 3.1352972984313965, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 2290.090576171875, + "step": 69, + "translation_loss": 2.643763780593872, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 271.05535888671875, + "step": 69, + "translation_loss": 2.4005539417266846, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1460.2864990234375, + "step": 69, + "translation_loss": 2.7309627532958984, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 587.48974609375, + "step": 69, + "translation_loss": 2.6674814224243164, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 4464.2490234375, + "step": 69, + "translation_loss": 2.0719194412231445, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 2226.09228515625, + "step": 69, + "translation_loss": 2.606563091278076, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 90717.828125, + "step": 70, + "translation_loss": 2.1528208255767822, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 436.49163818359375, + "step": 70, + "translation_loss": 2.7763588428497314, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 2902.628662109375, + "step": 70, + "translation_loss": 3.044722318649292, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 2395.259033203125, + "step": 70, + "translation_loss": 2.342508316040039, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 7609.24658203125, + "step": 70, + "translation_loss": 2.6820712089538574, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1053.940673828125, + "step": 70, + "translation_loss": 2.5480687618255615, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 247.20657348632812, + "step": 70, + "translation_loss": 2.5725159645080566, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 717.8414306640625, + "step": 70, + "translation_loss": 3.2339868545532227, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1944.791015625, + "step": 71, + "translation_loss": 2.708977460861206, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 489.6543884277344, + "step": 71, + "translation_loss": 2.8784632682800293, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 242.41360473632812, + "step": 71, + "translation_loss": 2.869791269302368, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 247.6901092529297, + "step": 71, + "translation_loss": 2.740604877471924, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 288.69586181640625, + "step": 71, + "translation_loss": 2.1950271129608154, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 5581.33349609375, + "step": 71, + "translation_loss": 3.126006603240967, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 8802.0322265625, + "step": 71, + "translation_loss": 2.2969722747802734, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 440.8104553222656, + "step": 71, + "translation_loss": 2.1279799938201904, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 46831.6015625, + "step": 72, + "translation_loss": 2.331458330154419, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 3356.504150390625, + "step": 72, + "translation_loss": 2.4402761459350586, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 2117.06689453125, + "step": 72, + "translation_loss": 3.1276047229766846, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 120360.9921875, + "step": 72, + "translation_loss": 2.8311080932617188, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 269.3521728515625, + "step": 72, + "translation_loss": 2.5502431392669678, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 46177.3125, + "step": 72, + "translation_loss": 2.1733713150024414, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1355.48876953125, + "step": 72, + "translation_loss": 2.2752811908721924, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 7202.33251953125, + "step": 72, + "translation_loss": 2.6413686275482178, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1125.8641357421875, + "step": 73, + "translation_loss": 2.4181323051452637, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 46261.85546875, + "step": 73, + "translation_loss": 2.023967742919922, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 306.3546447753906, + "step": 73, + "translation_loss": 3.5692965984344482, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 460.9762878417969, + "step": 73, + "translation_loss": 2.2976579666137695, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 18270.265625, + "step": 73, + "translation_loss": 2.240276336669922, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 107.98651885986328, + "step": 73, + "translation_loss": 2.335678815841675, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 3635.744873046875, + "step": 73, + "translation_loss": 2.0860302448272705, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 489.4286804199219, + "step": 73, + "translation_loss": 2.03962779045105, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1675.34228515625, + "step": 74, + "translation_loss": 2.882436752319336, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 170.40489196777344, + "step": 74, + "translation_loss": 2.0810625553131104, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 130.44747924804688, + "step": 74, + "translation_loss": 2.6264853477478027, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 325.5592041015625, + "step": 74, + "translation_loss": 2.399773359298706, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 215.5019989013672, + "step": 74, + "translation_loss": 2.2175331115722656, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1829.05322265625, + "step": 74, + "translation_loss": 1.8200099468231201, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 3942.4033203125, + "step": 74, + "translation_loss": 2.530977249145508, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 143707.46875, + "step": 74, + "translation_loss": 2.9543089866638184, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 3059.470703125, + "step": 75, + "translation_loss": 2.528221845626831, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 173.31137084960938, + "step": 75, + "translation_loss": 2.7352194786071777, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 4704.2587890625, + "step": 75, + "translation_loss": 2.662055730819702, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1886.5728759765625, + "step": 75, + "translation_loss": 1.9085006713867188, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 557.145751953125, + "step": 75, + "translation_loss": 2.4175682067871094, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 12372.75390625, + "step": 75, + "translation_loss": 2.22367787361145, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 218.3714599609375, + "step": 75, + "translation_loss": 2.441596269607544, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 189.05857849121094, + "step": 75, + "translation_loss": 1.5674161911010742, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 169.0945281982422, + "step": 76, + "translation_loss": 2.3991878032684326, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 2555.509521484375, + "step": 76, + "translation_loss": 2.6307430267333984, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 288.32403564453125, + "step": 76, + "translation_loss": 2.550554037094116, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1846.2294921875, + "step": 76, + "translation_loss": 2.4431002140045166, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1797.473388671875, + "step": 76, + "translation_loss": 2.167935609817505, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1057.87744140625, + "step": 76, + "translation_loss": 2.3742167949676514, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 37914.03125, + "step": 76, + "translation_loss": 2.0857138633728027, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.09, + "prior_loss": 1006.4264526367188, + "step": 76, + "translation_loss": 2.3448984622955322, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 2836.814453125, + "step": 77, + "translation_loss": 2.1626334190368652, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 3668.8095703125, + "step": 77, + "translation_loss": 2.5415947437286377, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 474.02685546875, + "step": 77, + "translation_loss": 2.4315125942230225, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 2170.866943359375, + "step": 77, + "translation_loss": 2.2770121097564697, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 237.66879272460938, + "step": 77, + "translation_loss": 2.62494158744812, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1098.0968017578125, + "step": 77, + "translation_loss": 2.4923832416534424, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1123.2852783203125, + "step": 77, + "translation_loss": 2.587108850479126, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1542.0316162109375, + "step": 77, + "translation_loss": 2.945643663406372, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 292.3935241699219, + "step": 78, + "translation_loss": 2.6705925464630127, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 5156.2314453125, + "step": 78, + "translation_loss": 2.374755382537842, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1185.436767578125, + "step": 78, + "translation_loss": 1.89633047580719, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 73.7678451538086, + "step": 78, + "translation_loss": 1.6164666414260864, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 152.19821166992188, + "step": 78, + "translation_loss": 2.3825860023498535, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 350.1268310546875, + "step": 78, + "translation_loss": 2.1219820976257324, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 156.78036499023438, + "step": 78, + "translation_loss": 1.8455872535705566, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 812.3766479492188, + "step": 78, + "translation_loss": 2.728545904159546, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 4088.561767578125, + "step": 79, + "translation_loss": 2.096165657043457, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 126.16314697265625, + "step": 79, + "translation_loss": 2.4692976474761963, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 2499.446044921875, + "step": 79, + "translation_loss": 2.6493308544158936, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 787.2802734375, + "step": 79, + "translation_loss": 1.8695296049118042, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 12054.025390625, + "step": 79, + "translation_loss": 2.845316171646118, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 623.5188598632812, + "step": 79, + "translation_loss": 2.2024900913238525, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 238269.5625, + "step": 79, + "translation_loss": 2.902215003967285, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 18064.404296875, + "step": 79, + "translation_loss": 2.6274876594543457, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "learning_rate": 3.9500000000000005e-05, + "loss": 2.5623, + "step": 80 + }, + { + "epoch": 0.1, + "prior_loss": 2001.1611328125, + "step": 80, + "translation_loss": 2.4772965908050537, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 2402.568359375, + "step": 80, + "translation_loss": 2.689046621322632, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 264.2572021484375, + "step": 80, + "translation_loss": 2.026789665222168, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 938.2894287109375, + "step": 80, + "translation_loss": 2.5126726627349854, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 9197.4658203125, + "step": 80, + "translation_loss": 2.959162950515747, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 5819.6640625, + "step": 80, + "translation_loss": 2.448514461517334, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 199.6078643798828, + "step": 80, + "translation_loss": 2.0148887634277344, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 79.2563705444336, + "step": 80, + "translation_loss": 2.021865129470825, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 819.3015747070312, + "step": 81, + "translation_loss": 2.610509157180786, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 574.677978515625, + "step": 81, + "translation_loss": 2.372159481048584, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 3408950.25, + "step": 81, + "translation_loss": 2.1979856491088867, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 540.3392944335938, + "step": 81, + "translation_loss": 2.2391409873962402, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 3631.97802734375, + "step": 81, + "translation_loss": 2.680905342102051, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 3998.156494140625, + "step": 81, + "translation_loss": 1.8267731666564941, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 465.940185546875, + "step": 81, + "translation_loss": 2.2211835384368896, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 2286.105224609375, + "step": 81, + "translation_loss": 2.9622690677642822, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 4246.5322265625, + "step": 82, + "translation_loss": 2.536022901535034, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 174286.984375, + "step": 82, + "translation_loss": 2.3389103412628174, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 797.9469604492188, + "step": 82, + "translation_loss": 2.4519875049591064, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 168807.5, + "step": 82, + "translation_loss": 2.849557399749756, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 83004.625, + "step": 82, + "translation_loss": 2.1897013187408447, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 5352.6201171875, + "step": 82, + "translation_loss": 2.5462958812713623, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 137.6193389892578, + "step": 82, + "translation_loss": 2.001232862472534, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 5683.79443359375, + "step": 82, + "translation_loss": 2.2103006839752197, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1044.3480224609375, + "step": 83, + "translation_loss": 1.6589534282684326, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 50112.0, + "step": 83, + "translation_loss": 2.8941993713378906, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1980.326904296875, + "step": 83, + "translation_loss": 2.0835845470428467, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1012.2288818359375, + "step": 83, + "translation_loss": 2.499967098236084, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 637.7876586914062, + "step": 83, + "translation_loss": 2.297672986984253, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 3110.8232421875, + "step": 83, + "translation_loss": 1.825978398323059, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 7347.40478515625, + "step": 83, + "translation_loss": 2.0527329444885254, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1162.50830078125, + "step": 83, + "translation_loss": 1.9670913219451904, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1952.669921875, + "step": 84, + "translation_loss": 4.018213272094727, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1194.5137939453125, + "step": 84, + "translation_loss": 2.059953451156616, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1367.754150390625, + "step": 84, + "translation_loss": 1.8094265460968018, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 6145.65869140625, + "step": 84, + "translation_loss": 3.056333541870117, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 1274.10595703125, + "step": 84, + "translation_loss": 2.229384422302246, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 737.7621459960938, + "step": 84, + "translation_loss": 2.2222633361816406, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 2698.946044921875, + "step": 84, + "translation_loss": 2.483255624771118, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.1, + "prior_loss": 2241.23486328125, + "step": 84, + "translation_loss": 3.4774515628814697, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 4731.48876953125, + "step": 85, + "translation_loss": 1.7512654066085815, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 16231.201171875, + "step": 85, + "translation_loss": 2.699326992034912, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 7562.39697265625, + "step": 85, + "translation_loss": 1.8780508041381836, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1232.088623046875, + "step": 85, + "translation_loss": 2.0843310356140137, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 254.7690887451172, + "step": 85, + "translation_loss": 2.2796287536621094, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 217.3579559326172, + "step": 85, + "translation_loss": 2.026595115661621, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 13733.935546875, + "step": 85, + "translation_loss": 1.7377129793167114, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 188.67626953125, + "step": 85, + "translation_loss": 2.444002628326416, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 5861.82421875, + "step": 86, + "translation_loss": 1.767945408821106, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 994.6979370117188, + "step": 86, + "translation_loss": 3.506460189819336, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 3316.9091796875, + "step": 86, + "translation_loss": 2.434568405151367, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1316.0294189453125, + "step": 86, + "translation_loss": 2.1717705726623535, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 161.98231506347656, + "step": 86, + "translation_loss": 2.8988285064697266, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 321.2611999511719, + "step": 86, + "translation_loss": 3.2503113746643066, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 352.31488037109375, + "step": 86, + "translation_loss": 2.963773012161255, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 4202.13720703125, + "step": 86, + "translation_loss": 2.2531118392944336, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 674.2916870117188, + "step": 87, + "translation_loss": 2.3830394744873047, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1452.8388671875, + "step": 87, + "translation_loss": 1.7052921056747437, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 159.7821044921875, + "step": 87, + "translation_loss": 2.810800790786743, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 5891.4716796875, + "step": 87, + "translation_loss": 1.946199655532837, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1198.809326171875, + "step": 87, + "translation_loss": 2.3743035793304443, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 847.7337036132812, + "step": 87, + "translation_loss": 2.100919008255005, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 814.1531372070312, + "step": 87, + "translation_loss": 2.080592393875122, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 139.66612243652344, + "step": 87, + "translation_loss": 2.521650791168213, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1025.173583984375, + "step": 88, + "translation_loss": 1.747448205947876, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 538.5001831054688, + "step": 88, + "translation_loss": 3.1119630336761475, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 979.7647094726562, + "step": 88, + "translation_loss": 2.0388121604919434, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1572.20263671875, + "step": 88, + "translation_loss": 2.1341307163238525, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 523.95703125, + "step": 88, + "translation_loss": 2.297985315322876, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 166.04342651367188, + "step": 88, + "translation_loss": 2.7449698448181152, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 519.5118408203125, + "step": 88, + "translation_loss": 2.0986242294311523, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 782.2055053710938, + "step": 88, + "translation_loss": 1.9546115398406982, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 2256.236083984375, + "step": 89, + "translation_loss": 2.702674150466919, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 3004.922607421875, + "step": 89, + "translation_loss": 2.2749221324920654, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 8808.826171875, + "step": 89, + "translation_loss": 2.7419092655181885, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 577.4176635742188, + "step": 89, + "translation_loss": 2.4940292835235596, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 269.16473388671875, + "step": 89, + "translation_loss": 2.7845685482025146, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 3388.457275390625, + "step": 89, + "translation_loss": 2.50451922416687, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1633.1163330078125, + "step": 89, + "translation_loss": 2.893672227859497, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1223.0601806640625, + "step": 89, + "translation_loss": 2.5179295539855957, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 3215.2724609375, + "step": 90, + "translation_loss": 2.3868284225463867, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 433487.4375, + "step": 90, + "translation_loss": 2.8418776988983154, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1199.5767822265625, + "step": 90, + "translation_loss": 1.6513601541519165, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 367.93511962890625, + "step": 90, + "translation_loss": 2.8715381622314453, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1397.85595703125, + "step": 90, + "translation_loss": 2.3916239738464355, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 2871.351806640625, + "step": 90, + "translation_loss": 2.495706558227539, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 833.513427734375, + "step": 90, + "translation_loss": 2.3677945137023926, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1221.408447265625, + "step": 90, + "translation_loss": 2.7376444339752197, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 525.41943359375, + "step": 91, + "translation_loss": 1.5740571022033691, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 626.1222534179688, + "step": 91, + "translation_loss": 2.5919065475463867, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 1130.6845703125, + "step": 91, + "translation_loss": 1.9024004936218262, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 2474.5625, + "step": 91, + "translation_loss": 2.0560028553009033, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 308.6060791015625, + "step": 91, + "translation_loss": 3.3840701580047607, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 157.11599731445312, + "step": 91, + "translation_loss": 2.810793876647949, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 14111.8681640625, + "step": 91, + "translation_loss": 2.3617758750915527, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 2437.5947265625, + "step": 91, + "translation_loss": 2.6349284648895264, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 2745.396240234375, + "step": 92, + "translation_loss": 2.1992502212524414, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 20505.076171875, + "step": 92, + "translation_loss": 2.6522397994995117, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 212.1503143310547, + "step": 92, + "translation_loss": 2.6325151920318604, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 2466.689453125, + "step": 92, + "translation_loss": 2.320836305618286, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 4438.78173828125, + "step": 92, + "translation_loss": 2.303989887237549, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 3362.9697265625, + "step": 92, + "translation_loss": 3.1038637161254883, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 2832.436767578125, + "step": 92, + "translation_loss": 2.4199228286743164, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.11, + "prior_loss": 493.4430236816406, + "step": 92, + "translation_loss": 2.626748561859131, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 1164.4012451171875, + "step": 93, + "translation_loss": 1.9225282669067383, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 128.4334716796875, + "step": 93, + "translation_loss": 2.061525344848633, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 39278.9296875, + "step": 93, + "translation_loss": 2.9530439376831055, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 4853.09765625, + "step": 93, + "translation_loss": 2.955043315887451, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 988.74853515625, + "step": 93, + "translation_loss": 2.463852882385254, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 1496.3431396484375, + "step": 93, + "translation_loss": 2.2266876697540283, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 68039.8984375, + "step": 93, + "translation_loss": 2.215089797973633, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 1089.982666015625, + "step": 93, + "translation_loss": 2.0422778129577637, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 1244.820556640625, + "step": 94, + "translation_loss": 2.3686108589172363, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 272.6587829589844, + "step": 94, + "translation_loss": 2.327025890350342, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 489.7776794433594, + "step": 94, + "translation_loss": 2.5966081619262695, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 13665.3310546875, + "step": 94, + "translation_loss": 2.257702589035034, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 3116.8662109375, + "step": 94, + "translation_loss": 2.252854347229004, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 265.9984130859375, + "step": 94, + "translation_loss": 3.1114156246185303, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 17880864.0, + "step": 94, + "translation_loss": 2.673755645751953, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 181.9965362548828, + "step": 94, + "translation_loss": 1.7087515592575073, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 535.7645263671875, + "step": 95, + "translation_loss": 2.6441538333892822, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 3762.96923828125, + "step": 95, + "translation_loss": 1.8098499774932861, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 63450.05078125, + "step": 95, + "translation_loss": 2.4029808044433594, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 245.46275329589844, + "step": 95, + "translation_loss": 2.1181538105010986, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 5470.880859375, + "step": 95, + "translation_loss": 2.4144041538238525, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 1518.2252197265625, + "step": 95, + "translation_loss": 1.8114609718322754, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 194.05186462402344, + "step": 95, + "translation_loss": 2.9043009281158447, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 18542.99609375, + "step": 95, + "translation_loss": 1.7459291219711304, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 17439.513671875, + "step": 96, + "translation_loss": 1.9398523569107056, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 300.26190185546875, + "step": 96, + "translation_loss": 1.764165997505188, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 1511.056396484375, + "step": 96, + "translation_loss": 2.4673428535461426, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 3338.33642578125, + "step": 96, + "translation_loss": 1.9559627771377563, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 568.9901123046875, + "step": 96, + "translation_loss": 2.5658740997314453, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 6277.73388671875, + "step": 96, + "translation_loss": 2.4446990489959717, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 2840526.5, + "step": 96, + "translation_loss": 2.0065083503723145, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 45670.02734375, + "step": 96, + "translation_loss": 2.296529769897461, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 500.1962890625, + "step": 97, + "translation_loss": 2.081814765930176, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 179.81248474121094, + "step": 97, + "translation_loss": 3.1804723739624023, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 405.95208740234375, + "step": 97, + "translation_loss": 3.09875226020813, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 3161.065185546875, + "step": 97, + "translation_loss": 2.165872812271118, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 2794.010009765625, + "step": 97, + "translation_loss": 2.244804620742798, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 2425.6669921875, + "step": 97, + "translation_loss": 2.1301333904266357, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 264.772705078125, + "step": 97, + "translation_loss": 2.6575262546539307, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 11592.583984375, + "step": 97, + "translation_loss": 2.2070670127868652, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 815.761962890625, + "step": 98, + "translation_loss": 1.8119982481002808, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 756.2555541992188, + "step": 98, + "translation_loss": 1.7990299463272095, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 645.7431030273438, + "step": 98, + "translation_loss": 2.862051248550415, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 3868.37060546875, + "step": 98, + "translation_loss": 2.153024911880493, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 1594.5635986328125, + "step": 98, + "translation_loss": 2.2460052967071533, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 91777.1171875, + "step": 98, + "translation_loss": 3.550994873046875, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 437.5003662109375, + "step": 98, + "translation_loss": 2.2599036693573, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 180.99166870117188, + "step": 98, + "translation_loss": 1.8803231716156006, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 1573.092041015625, + "step": 99, + "translation_loss": 2.405677080154419, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 88930.015625, + "step": 99, + "translation_loss": 2.264021158218384, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 827.8090209960938, + "step": 99, + "translation_loss": 1.9022517204284668, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 6368.966796875, + "step": 99, + "translation_loss": 2.393932819366455, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 1497.4859619140625, + "step": 99, + "translation_loss": 2.315967082977295, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 3742.3408203125, + "step": 99, + "translation_loss": 3.3975725173950195, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 218509.8125, + "step": 99, + "translation_loss": 1.7615652084350586, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "prior_loss": 481.5612487792969, + "step": 99, + "translation_loss": 2.749424934387207, + "weighted_prior_loss": 0.0 + }, + { + "epoch": 0.12, + "learning_rate": 4.9500000000000004e-05, + "loss": 2.3838, + "step": 100 + }, + { + "epoch": 0.12, + "eval_bleu": 0.02768705023404104, + "eval_loss": 4.190079689025879, + "eval_rouge1": 0.21952731403473935, + "eval_rouge2": 0.06715399580496624, + "eval_rougeL": 0.16000726579164942, + "eval_runtime": 35.0327, + "eval_sacrebleu": 2.768705023404105, + "eval_samples_per_second": 3.682, + "eval_sari": 36.89731900527743, + "eval_steps_per_second": 3.682, + "step": 100 + } + ], + "max_steps": 12060, + "num_train_epochs": 15, + "total_flos": 667579250257920.0, + "trial_name": null, + "trial_params": null +}