diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8279643c166e1c3c2c0feb3102afb83fc81f84d9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0f819cce9e58dbf06d38ac9eb07f0da26cf9c96f4140cfdd743b12533aa60e +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f0ae074a30294a783050f438697c99b516fb7d3 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38ecad11c5cd56f669cafa59e839a5585adeca341b7c42ee994f233c7e95676e +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df98d0532828281ab414f96bdb321d68e443b4b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee80a2dc7b13f13dd6f409c89155694b42503ea7dfdceb4691b24aa6664b8b55 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da028481651109bbb8c21a54da76c839f5e73218 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcae55dec810555cd4a142a827da37eecf777fe60ad6fd35306be11a7d3cbc1e +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aaa77c7751e7d1e206a912bddf07a08542ae1d4 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ea4ff20b8424859e566e52088ec1e80c4016b30e72f94a30aaa86ef0a65b39 +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7be4d320964ffbe1e0a15f080292d752c05359b3 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790956b7805c948a0e923db764ce00e2607f592381f472abdd5c7a1e441ecb83 +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdd021d5b1362d460a1288cce92571246249db68 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485a7663b4d75c4900c6ed5c75cb3dc0c60c7fc7295913274f2b16cf733b0a5a +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd5fc2ac2d5d740fce3f7f4e2bca40086b0c5b15 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bb89d7233c8b1da0f521d8221d17d9bd1e204fc9bf3f60454cec39190b6b5db +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8d6ae22750cfb0cfc20dcce549c9ed770c8dfe3 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4b2350ec5ca6c07c5ec0a5d1ddb9fb0ede0be1c6eea9827138961608093566b +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e74e847e25f22fc51dff2d6e96fd1cad091c4a9d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05ae92c87ffa55c774524519194166d98d592a23a2cbe715756e61bfcc4d1f29 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a5116ef9e63520ecb05c8c5b2dd5afbf433f82 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b9cdde754febf7d7549191f9db1d59f461a4b2f5a7a29390c473eda5afa5f61 +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7046e54958e48e2bffddf720663974df106c2190 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16167732af27ca85e5df392edb40ca2133bb740b94e441ff6ed66e9476c3d410 +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..855295749d342012f288abd743da882a80dcad98 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1136f0dec5185b0aca8b8f2d002d36b778406c795bd1bb172ed559ba0dc5e3ca +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3dd3aab093682d3f5c42f517f19c0264e222c2c --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59982bdb5b271f8e652b61b290b3520426e92da4d4940149baf10a4fe7d0bf5c +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e718194f77762a7888eeb2f6ba1fef8811ac971 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed9dd5ed903047e743c592e7ca160c8a01d6fe9878b580010cfdf2faf5041c9d +size 199058669 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..197c4731aa1d6134d7d06a351a88af8598f9dcc9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55944a51c9a6e847ba36501eee80db3189c0f914e0fc1b267e2cf4b2ab0c85a5 +size 199058669 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43acb3d4a6d8b6df7d430e28f5bdaf112c499a80 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56444934650d73387e0335f83cf54f14685805ee3bcdf7b3524aaa23318d498c +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba55c26262345d273c152209dcf0f5daaaeed04a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2147a19e285b89c6bb61955596298d274bd74ac72acb4804fc2913e4365e4e9a +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..449fc6d49d2b4d32a118cfe8add6f8e98360ac0f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d587a5b9721fcb546f5ceef04c5be43df350b6d905e67af59161a0d14e3952 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f63d1a801f99fd131984a7d473e622dbf79ab83c --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4198cd3fcbea48409fcd6a2587d1460250852ea25584bb6b6937ec46c6b4af27 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a86aed91752ec4a432782f54f6e4db56392cbe99 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f63baa11cae5081ba3bd05ba41a4c4956dcefdb783e11cc2865f6b91cc27829 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc826ac20e0d75a8403f4ba3c003febb448b5fba --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c48bd1c4e09fcff8261858b4e35083e35bfa35348631a403c3849f0968466e6 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4218912e663bc2f844fdd78dc1d8e14e08382162 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a657bd122517a342b4942894a67383792ae16a245ba19ff24b06367399290ede +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6e9284019395c82c4635910a7875031235d29bd --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:253ac5e394e7a3ae665d10d50d92a46989e3ac1244cf42199ceab370b10fb8a5 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae023261036e8ef5b8a921211d03fafa989323ef --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9a0343d08eba3b9afed9c62d9bae69b40ed5bea9f56467ad7d8461ba9d230c +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42ba88742d64abf35e3a1775ae894236db110678 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95126bcf4eac2e24b3dae91a1939c6599ec410d73bb3c25868829c6d3e266e19 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d71bdceacdb598f8b5fe98b587c8f347400022cf --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f66cb0bd326154153928aede2b4744fced0235eb413d44bb72d116791aaaa24 +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5985d7a7d6bd291426d9d3b700f17579dab08274 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a59070cd5f8f45574e4cc22c29cce2ef9bb4f98318be7a56f578a7f0e8020889 +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfd53c5c49147eacfaff6bf5b140f0a16efc91c9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcfa26032d6a16a8930f59a57133752cb668dd8c28a2ea8030a077def016ad17 +size 199058605 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98e740900e94e1a6af0c2fcfc122b1b94987eab0 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6270060c2af9605acb473594d62c05cbd1ffa3cc6bd89a9374290bec0fbb75f +size 199058605 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81fe582aaef716c12b423fc867a90d29097ed4d1 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae397a01195b0ea07bca9675d2e017b9a9c71148c88625a2a29f58e44690fd3 +size 199058669 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d3fdcb78a7a5d3837a4dc98417615a9e9280815 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea1bfe7b33a83d58d5d9b6e2ba65f316eed3caadcf9d3a2b01918e60c3923f0e +size 199058669 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec2c0b4e6aa4977c1ef5de68855c62642811048a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60830b66aea6b9fabb9874c5183a1ca801cc6dbd8e930df5961a2024d0d91919 +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a69676113b3f76cbf053472ae6516a8281291988 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63ee8cf652e3de01635fcb663834a53488fa5a21bac56023ca429b9f2bf6fdd2 +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5271717d64cfad4dcdac68e2e07deaeddc663e0e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df7f841dd3c5063c8313e3a208e565495637380890ed1367b877071a37aeb849 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e637f5efe6dd0eb679cb9b7fbefa9e32c1ee0e3 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e62a6cf523f8a6efa33a642ba0a94919362e8f36fd045113b319c2d0ab4d35a4 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72f11036be25d54fb4a5ef9be55bc2987ae9b657 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b488a57c519e96f3f8b0a77cd56e4a40841e41a55ac6d75d7e4707bc192cd891 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6b3d84467666bdf2e6c2b01118ea4692d256f3a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28aea2f7ceb86cdde9e7116fe45ccb98761d5bd03b1706e8fd7970af29ff4281 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f2c60a23f7ce0cb2f6a65c0c25ae4e392a01024 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf3c327c7fbabe8b630b3b4c473eca799e12f4af9d28031da9133e3e7194644 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96e22f27cb645aadea7ed8b4acf844a4ba7d298f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c9178daffb6fb0f4a6598ef9172e8d9c2694693949d031fa980eb4420f1fc47 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c8fe56a71ac3455cd373723819231d8b8e26e65 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62c888d920d09574bb78617e9e1520675f4dd88038bd3599d13641b459b03b2b +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec992e505f863efd50faaea848bac34bba5e8e4e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ec38e98475df3b7e231f55791c77c780b6717fd77caad07c9811eb2d2dccea +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de7bde9f49bcc22a3fb94d8a121e003e10486c93 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d558814c40d0815cd0449550e63f7d85d2c14322e315897e417b1b7ab8cb585 +size 199058669 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5dfffdce3dbd2fa98088965d06f5726c9f0701b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfff2fe3334a511f604a68c1b83a442556946dd1fa3b2ba054ce2fcfd5874153 +size 199058669 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..088cd5a07ad9a0917c16c2e4251e485c94b82113 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a82161e60a44161b8b29b31b6d9511711a1c008cae4d3cffe7d7a2048be0928 +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b19de9a6a6dc6e6c8088dfb7e07c1fb1342c1b66 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a66c24b668260c3c5ae0c3337a409be897b7a55d5ffbf288b117a4a9114dbc8 +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..087ba880141d7d60c827f08761b3bceac6a68122 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d770597d2ad43c7ce72af181f5f8ac5c502de04523366d1b088c53124febfd +size 199058669 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dbfa007901140a62baf9f2eab31eee398925f22 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42c4d28df950c7c8ecf706caaad670f788582d4a1da4c4204b612d35b1f664bd +size 199058669 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58dba2abad03f41298a3a69a1fd796beafcc9d99 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2e1dbe8783ff3b42074dbad25c987b4d155c9e6618c48d44b0238157512c040 +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acee3aec6ef91be5f6acc8c69fe62369e988e31e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79c31a158241daa15eb1960944988875ef6baf74f77b25257c6bb87dccf79e35 +size 199058797 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..675892654c6aab117a7ba9269fe50d5a4338af6a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9506561c6b6b8e00130230b5cbae672016df42c9a76881e7b3c59b2f1c1573ae +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df4c928502a549e85a7d421756067e49af54f52a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca95c87fc857b44a756bd9b1b19b9f192536645edb5afcc6870abd817f80a71 +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc6d70ccd8036793354491df94456468b26f082f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1249ab6d4a5dae4616aae6cf2bace32421494ffff5f535ef9a97bc2fe7ed220e +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e111dcf82d0fa5d92a8d82c6d6272dcaf37c4dae --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a07834f4e70cfed2ccb18b7e04d32b35a54ce404a6ef84a236834b51ce228cfa +size 199058733 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ac6dcdefbd66c7629d22dfab56c89c666b2c4d9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f87f9e742eaae04b4de0c646fc96fe25d77777de3d7e6b3c920c4fdc64a9d9 +size 199058669 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e591e05c43740b30a06014fb5f4798e883c0882a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80419784cc4aeaabd006af6501d1d665b6adb22f7782e1086222d0863fe85661 +size 199058669 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e68ee2210142326b996810e002cc7733ad8dc8b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:056f95c055f77d52635f49881183d0707b630c2c0b0e3168a3c910222ea64d87 +size 199058925 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8a7cf39b1db4b72d8e065006f8bf944a52f3c5d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99a440c3320ae1031e894eb4f5e9462dc95626a07ba694eef0ee45ede15d66a0 +size 199058925 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dc6c4dfde0d340093bd7e12e310c7e77f67fee3 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1a61f7e3efca3d529b07c1144dcb91d033bec7170c63fbc03a0abe854ac28b8 +size 199058605 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a012fc162d636d778cf317d7d8cd0b0db8dc8ee --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db9891a7184246f96db10e8da75273e15f41d9bef5af8abbeec039ce4aee4aff +size 199058605 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98974d7ee63771b5860338b0f408b85fbb3be3a9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:497401a3554667c28f9cd4ee821ef73ba0fcbd1d7a975c2fe006d877a99bcd23 +size 199058605 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9067ba610a654301422dfcb5b0fafc46b50e9f76 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21cd78ea9678a4be4d84a84744512d6be2cd88131c364628a23f8dbe34f7f6fd +size 199058605 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..312496a0f2bf58fa93ad16d4573909a4a5218f55 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa76082dee99972788bd2753e6127787fe55fa24379c9091085270d6c9c71ac2 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e1d27500305d45b91c6934606edf423d88acd8b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b0351da5be62793381db8b6c167581156dbc1bdf69ec2c7911b49d285dd274 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cae418bd7031270e6ae859fad1c0f4567bc82509 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8abdd96b4e4ee4fc6efb8392f47b6b559dabe36ddb8d9aa48ef2824a3726c1ad +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2588db982d094e90be96e4ea95aea991906cd6e4 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e38f788b4f73cd6e17908a87af4f6719c2c4e90c49821f969245edffbf1167a7 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dd547e525a61f6dbdd8b9088587b3161c9e20b0 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce528b0a599e967ce2b42ba1c4b33f9d4460a39224e8359eaa04bbb6a8cc1d3 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b099a66ff00e58846651991bced4710c31c81ff2 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236e2c83174beb7ccdf8165168f24ed9b75892b0b8e3f1e86194905882aff2df +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec3707436cd95bde2af9453b156f1cd34ec94dfe --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03e2c2e9951e94db7365a15b10022798a917ffd6cccc5e4561145178f74df9da +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3280dd53173f3ffdf1a83e05f4f6bd5fd8f603f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:775550266ab2c721ec7206448a17aefa6923b9c779d73eb08f2e4c096a7604ad +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3731eba6308a8576b84ac7d084b192a5f215af57 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9a36384144d9ee6583d8f71a292db2f47b60889dddefb0acf9eca9c42694e55 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad8066aa2e9f228209cb0eb0906bddbee5ccaa9e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513181c46bf5715ff594f3fdf14d819b2453a307e4785cc6ad5f98e0e2d27b79 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08cc1fce51980692774acd48550013dbeb379927 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8621395e4f2dde4fd76c03b00493c8f3de5ddb1fcb169f52f1e610e3e2b9242 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1df43a30822e4db8a1e2499b13954b81a95a7362 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232ba18ef42cf61cdf347ddab073c6756d9881767ebf189a577cb0b1b4c9220e +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b290b13e766bf4c9f1e4cea9e702a3344124a4 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f40af942908de8bd9634accbd08f8785da0f450a2f03053d820ed15432fef35 +size 199058978 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..650b1178a15b77d35148083a614c01ddaf9ed4fe --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ca5dbf7a3b9e941bd3371521e39d7ef9b158653422c911f956807159ace708f +size 199058978 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ade47e055d7ba90ac737024f6f9e434bb6bebfc --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b5da11cf450210355bf9bf74accc177573894c40ede2104e8fd0c8fef4f39c4 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54f3433a574efcd60728d8cd62152eb0001d1487 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2f8761984093511346bd5753bead5f76e6dce7970eaa663ab996f868f100ed2 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83bd852c0021664fea583b8182183721995a6e14 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f38f49494bfff14595722ba109ddfb56a755f59f5754332137521f91a208caa +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe80f7a0407057a1f3bf0ccd6144149ec630ec2a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1271430edfe9b9036369e4dd035f2f9e3d4e33a977439229ec8fbec2a3862353 +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..954249735dcfaea3fada96b3b30e4942cb11293f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1340b5f30e4b654791be1655ac51bcc61ed25054be34d99936b5570f3ae1a9b5 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5cf9b68e4ce7994f0873ef0089c1908b64c2609 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e32c78da71fe02468ab9d3dac7e50f58ff85ea455ebfbf2b2d9a84a561ba4b +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..795ed936a8738c6d688f875670198643e9c3eb40 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ea0fc937356da1252c94779cb98b4460f8d02b211264818dd46353a222266dc +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0a6c0ffbd9ab54fa5b13058f0471f06665c6f9e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad411f0a81a5f0356068f0aa5b94e3a8bf6fe55badcefd58370d64d6aad3feb +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d6e475b780244ae6d1f52698fd01f7bc5e5139 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e71676b78ec719d0a2eb6c8b16d8b7f0dc7aa9214cfb70ec53da3e535ded829 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bc3d2ab562ee4bbbac89be2cad470dc629c72c4 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0459ec2229a44f9c2f8bcae8507d40a161f0649ea32cddbebb4b357db78ee631 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88a837edaeda6a29f3d95afb79d2782aee92b689 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6ec2e5a81e9b3568ead74885cc2493ea4a106a32f5350cf9af7a707800c689 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c445913c3349caa10d802461f6c69b9e508eb4b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a064874867bdb6c6640a9c7707a1d84bca09be563baa0ca5aca2b239de4958 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcbfd433ae8f46feee34f9a995aed74380ecb657 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed3f442436f7560a5fa82e9db3d5e0692dbc201ff536a81310cb21a0103e0258 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5c969f376c0aa52894e655a627ba8930680e3b3 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:430bb07fe70047e8fd6e7d2bcbecb109fc2e2b6ce629990350c608b950748859 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0449c1a3831d2afc688c2cfa063015399fd72a40 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9bf40bbef79a4f73f032dc7181890b37050e41cf274e0cd341becb16bbde737 +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fa9cb3637561322a9341814fd1d176893935f4b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a61e24f6cbb5db0df2242a25b775732420fd3327bf43c51a7a9d2ee9611d91f +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..272987bde82abe077f610543d20d5f9382730379 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48f64f0cf2db05630e87aef169bec5cb00d40b27f929bcea377d7d11aecf0635 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26d6799ef4636dd6373dd02ace8545917bbb5632 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86286efb1b214760ce55cdfb285a57f2bad6da0def47559707a1a386deaf1ba4 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..497e2e66c78acfbd2ecc3af7cfdb71388c111adf --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b20c58d0d0b10b15468ef74b2e0e4301d7544049a890b883d9db7876b189fee +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12cebe859cf0761f9f4cfc7989a8ad0d014b3daa --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:420bbc0ad452de83887f01291771e31dca2b128905fa32463c2f5314b658088b +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b36b0aea1b6177653064cec3130aee7ab4694a28 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11fd1dde76d010eee3ce7f40ac2b7aa1122b6f00076c7a80f799bd47e63eb7a8 +size 199058594 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aef4323753ce41250a4671f3aa9f1f493d853cce --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d03823cdff1ed1960666150c5c1cc4c168148e70df0bbd2182801e0a3405d0c6 +size 199058594 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c4e7b49b5508ef8716e134047d8b27e47818ab4 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3256b6209322d59f5ee2245bb248d61315f865ea0309e13a044de1158746e983 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..087e79f28d158e3ea2f7096965ebbbf27e72f9fe --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246e52ac57b2a07e91e3ea1e10d74ae1adb9675aca990e8442083684df01984d +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bf8bb845c93c3a72961a6c04c2f6e61b189f82d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e3fa2a8ec51e9fe4afd78859f261fa37b8a3da890407b724bcb8e55d44ee3f +size 199058711 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d212536f077f20a92f0372d73177d60e0bee94a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be7b4d7ba61a2f43c0cbc82dc03a4f48496b31b73f2bed6ad47ecbc14a20d1e9 +size 199058711 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1badd0301944c3a517744af212a2cb3a9b8e18fc --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9da65e1e43374f4db4fdf4f77c5b962d25b0b8004e506d7bcae171fd497142ed +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7b8cf85fcdaa21e63a7838b2c40265004d1df3a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d061d13c8e90ce09ad7268392cade6ca350311374e8f6dc92073823c38af3e9 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e4718dabd819a5bcb53abf6cb2db7778e3b2ef0 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0b5d4b90d7d586f623707d7345ba949a4eb10b761f2da8a5ce0cb9a3c67b07 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce120f0d503afdbd6c1943a3af7610a4bf42e8ec --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41053f535b9876c99572b5aa379d773daa7d5e27d169beaa71ce6d974593fc9e +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e27ce0ef02a31e28565e30260f27a8273b4e69cf --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d52835042385cc91a0ae889ba5424eb87529f356ea36266ede329a6d561e344 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4594ece5b7613c1bc23ef55a23e1c6ab73226a2d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5888f08aa7d6a35f7156c3de9dc8888505423dd26a47d8e6d3eee6f0344c24c +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25df409d19414269a885d983ae8d13951ee2b595 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc0ed788569dd43d45ca71a6f59ca723c2955a0954097dd368214581a654bee4 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..968fb31f260aad7be5c49b57c363aebdedf929f6 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:604c98a9d4a7caacb716a8cc33e9117bf8e9d1e115dd4809cc67af5cd84c031e +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7add051e887ec0fc70d1eef9167054261a4fd01f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d55aeff00b4bff9e9510c3a0bf7b7161a8181a0342ec5f1bcb02233abd7c353 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3dc39f6ae6d6a887a5baf7a4a9e0e8c797f3b2d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf98e3ec75bc7ad029e9d27742e4afd568672dbf00f7796d99daccacde07c561 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd0154998b201e179df6e70372b7c9ef55a08fdd --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5178cdec22a76982224cfdd6ce3db2a6d90f5d13432150cfa16c3861eaf9159 +size 199058594 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04252d400075ceb04089937e4d453745692c34cd --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbd114039104efce9d9cfc626860d9259af15fe618892a0249af73572b882328 +size 199058594 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1dd2648b0c800b475043bd5c20c414246896e11 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1172b83547575da721527fe0f9cb35cdc1cdcb7ad66aa920d3f57ed016ef8d91 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16139e18ec80c982afb5d5f2693e5bee9116a83a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8e58efea2d7d414cbf1e8b7f4826455394644aae87fd5f223376aad18e3ab6 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8b26ec5b7652f2339f07a01398ff2f792908776 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e93cbff0ea5764f23c6ca9640faa288f22d059cb7cbb6291ec183d1909279672 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e634756e99c94f9360ddc16908faae4519e906b8 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e900f0660f947ca6bf1f62b27df72df706f2bf5217d61476b288fe67ff9b95a +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..352c0cea1dea93bfc0143477ad2ad8e2f20a7953 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e70ceecf56a9d356e58a17d312ffefb0de2d605159ce5f39329e4905e0ec09 +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e1dec1a88324f9ec67c51fc657c27a6c03f06ca --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bedfbe785e354d58bef0523978749eae2e5ef4ec67f06af78eaa0b12375cb64 +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa84b908e4e0f642280aff65966eb88f2f388cce --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4d0842d751f91cc603b55f405a8f9be602cede08d52a65d3efd96a8484e3c14 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cad4e983353ea825e565a44d2c76bab18cdb91a6 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4092a7b846d5e24be47fd9dc0b380d4b5b7994812410c28779ca2ca12a2daa4a +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9207f252fe863be40bc35f8f1157b29a54322a5e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e8a47477207a9ce5ee8221331845d2aa4bee20b6f4f27583d8ab52f8d5734ba +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c20f4ab5de9c1dfe9a5a434edde1b7fd42a9016c --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4cfaf19427081f0e2b18f5e4c1d68d253dccdc851b23aca93fe671c58aa82b0 +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..822a828db42c148543bc55a04988e17fbb6ff5f3 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0a33b65fbff1f87b410da114d6b24b35f78566cf268d02042c63a0053613ad +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1328e8570ef828a62e05e866f34aaab9d7d588d1 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d504e4018f9e10e94c43ee08a04df452118bd694de207655d56eab90af3ece58 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..246f2a50bf5af86db139d145274f524a04372880 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9204b6b1177a41489a7fe5253074aab857be4b289da1f1be713176dab595cc +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14eb4a82351a1ad31b897e38a2c3b7f8a5dff2be --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8febf05a2b90d5d292fd75c8a3e16b553ff1a44a27178677b818a0beecedb2a +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46ee341a30ae35379d4bc94ca0d7bed02fc09731 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f0af9a99e1e4364198bbef8bd1f55bdc01bc3996a7e97e929a1c6a4eb69de0 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69964ca5ede4a721ffd87e6b2d9ac6a5e7a267f3 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d7542fca987c00c653c56a131991bbf295d57f2e1d9b30d11f1fbbe04e054a +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3703dcb8dc2c0c2aa9e555a2e81cf304636e838 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4245d52e76b4a8bde47593ea12a584df4fa56e31b6f17d9cd79675b9726ddec +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c09d74166be9076f4b6f1ad4048a12fccde4996 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c5f79b4c283138239a6fd0079656186a9691ef5ee60f7763da05061e5d301c4 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fbce6a1470f3bb3f955883573d311bf4caa0c66 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5150340b88f12843bb71a5b1cfb82409844bf8cf382c492b723e178739327914 +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b6b016dbf297411361df44dda163b1f6ce41600 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5e22e0c65b2705f2bd5963c51716072729ef2352d38630f5990f46b7dd7da4e +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc32de92ce9ec23c55c02ab8e2eb86983f1d3253 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52de501fc575a5f4ec56f1bd8db0ba594a43c2c2e5f16d925cc0a863824ba489 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d032f96494c54ea37301854d5067c1bfaa54539f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdc2c3cef54f181543982a1aecbf13973a7f7ec5e19d6cb4219c804cf1b6afa8 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..789bac55d58d2b3b4ec03f0cfb600dc0bde810ab --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a67574bc00861fad9e578d1a623fb2fbdb027365da2494c93f1779a9240994 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c73d6d334a1acc55985bbce8768d6f175767c76 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0615209d9f826eb673a85f12004e536bf5a8c7be42d56eb9966a00fc888920d +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d3a530cf7b4502497bc587b33d63a01e600158 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dc3c9e1a9f4cf6fc33e26d3b4cbdffe686eb55f14c6c8721a237cee780fbc4d +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acea450eb875e304e89dfbd43430f6bef0879633 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f5bf58ec665b170fc2d50195a205126040742f8e88724eede66ed32b3d0aaa +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c6c76ced1e47df57415a913a0525456ad435d82 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:064f36c492b335c21a4a54c9333b2e70dbea7c4dfeb03d9b405f95294cd8a380 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb1ba7069378f6fdd4ab7bf1e0177f990012aba7 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ffa3d9c15d4e54e3d1eb576bec82f9c98f5c39037cc8cc6e9cba18a51bf984e +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a12999848f8da19c8d7c0fa7a4c77d0ebfabad4e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8993d16ccc3013cbfbc858849c0b11167913887935ddbf3d6402a1156fc34bc +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73b9e0dacd0ddf96243952dd1387f7807f67019f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e4f87ef8bd89183b63afa9c267688342e5da20d8be53f7de6f9dcfceb2e0f38 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5657f03ca06a119592e476f4ba452548565816b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fbd5e26c56ad14adb9a7115014b8db5d12b425582cddce1cd64cbf695da2dd5 +size 199058775 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..901e5aa53ee1fa9703c87f366f4db3bad9f2cfba --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec5ea0e6d5f4bec3e4891c59c15d614b1c5cc98d8757ce2a14890e1f1f547ff1 +size 199058775 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63d4fa0e2935bd01ce0abaf09c4295cf41eb36f1 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ef4f8672e03f613db9ea2e33cdee58abe8c4cbb1f64294b6987c167aa4b986a +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fa840e82412ce0165200f05fcb563aae0e0a532 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5b4dc8336edb6fab0b8fc61718676a044bbf3cc203729c5f9ae341ef07a25a4 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05ea729c5fe47c751450028df36d46ea6ef12d7e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b75c4d5b42c44b0bc141321d0a2821c29f836dffb569ff326bcda85c333ac48b +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50664175914d5fd027cba984c3687211c03115e9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:983b2125e08fa25381007dca6ad3a7ae449036bf44f43090ec22f52e476bfb9e +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8e5c31e94c4f0381567535bb0d1fe49b2bb70e4 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3953c1b5146286e0ca4086ca5c169dd2b31af42ce87f7ec22f3224e12740c5f7 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc7e493546806b4074bc5492f9a141e6df134d64 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5810b02d237dd175c4194ff3e5c99ece1120b9c499017810b064e1b089411456 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..766fa334da0cbf4a8dd660b13ced820aa9f92175 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed551ad1cfa111319df63c4190c6d5caa730ce5eedb03341a385d73fdd704d03 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83aefeabfa1bf8843b21c412a83308edf1716bd7 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ca379d9fb82ff308109516f1bf8d7a86d432f6a0d803a1981a2031700595d9 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03349f01f2595a9bc9f6367431bfe48ddfd81ba7 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73706bacfb353abac00911cca0db952132efd98f592c272635f130a33b9746f6 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1f7c92e5520b9efc56eb311927d66cdcd1c0c15 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20fe43a5780866f279bbb5beee3bb7b83234e934bdc2123e86be28d4c703a58 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffdd37372808df44d34f2eab96378118b17aef84 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35447fbdcbc78c2a77c3d1a3dd57c42bc2efa68cd9cdb7b927198d3e6df86d29 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6606c6f677853f5206f5a278be340be870a95b1 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab7b6838c99913a38d510a6dc6af973229f938b5718bff2b5e6412a1e7da076f +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5392ae9685bd9be3d7797ce4713ccfb871dddbfb --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f3b613b7db46bc6cfc2e599757b105930e1d0c2f2b2aad2a41be8e71eac516d +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dde4051f9d3f8114cce1276e6f51fd964b5df06 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57b16e2724704cdb5830205d554c2e1bcd21ced1d097a49cd6fb3d4c6344f20 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e219b7e3cabd49f45da2eed7fa290e29cc98b011 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe60b2e1dc2c809c7d7e616dee8501d2930b6db2ffb46cfef418bfb6867aba7e +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b65fa854db0d93504a9b5b804a5cd958cd0cb3d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4488ce901f6dbda5bd97bb3698a9c924116994bbdccf2623d0f8e830d0145243 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ba77f4eaa8680c07df753da77983e90a3b46115 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ed1455b34cac3e8f003a1e62e8044d9322321b47112edfc398d12219097b97 +size 199058914 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c6e2031378171249c0c9210fc1d0508427a47b2 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c4b6a7075f48299a665e97401575a14bad4c145e409f16c8b03c90e35a006e +size 199058914 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebe5c13c88a2676dfffbbdf63bddadec73071021 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:289b6afd590b7168632c542082d304ccf01f461ff47209e1e50636672a0df9a8 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa6b258a86ca77b2db8b941ae85431e2d2385046 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a15996445815e44c7ddc2622bf6b19a299bc1db2b764f5efbfeed2089728c41 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70f99dee1cc31656e7a1a00fd39eac5330933a39 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6059a786f35f118f36422e1a04bcd1b04ba62a8526fb608e173d0e8550d9a57f +size 199058711 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ab5afcd5c5cfc86faf3e7da28da260597b36760 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb3e62dcbb8c26edfd6591cf11714c1dabdf0a55ecc1d8e6768e35c6c986c257 +size 199058711 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..383cc0b02a68ab01b599b450b334c890bfc0e799 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:614d4249ea8b1e4452bcdf72badd2964e46446c0fdd63115a16e679ce6dece21 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..061a0a9c02076415e9529a524ac1fff24b0d6e8e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b14e7256e4514a81d2c1e0ad1449e20032a955e046d4ac6e8f934d57462fd0 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f915a559935f43c781a53eb57c2f852cd5c630c --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd38da1951f994060f34fe614da6242b655de0197c6cb541492a2359b1045a8a +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..217b10b5b356244e2746f837a83aa822fe88e07f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82c2953c039736e838e27095086830dda2df264f25bd1d0a95c53a09eae11d6f +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b21e6f73d8db1ce81825dd2c907796e08dacc1e9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1170f48efd6c96a8c9aad351d4b3d0bdaf46cd015d45f5d9ab795e897c2fa55 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91564982b4adf2aa4a9b5d31dc3c007ecc6c596f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25e6c9f3c9328608dde574b0e40205dd0cee48d6ea16d5a7560002e9e5968693 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87b8046ef024df59c50d8ef15ac67a6016f631a9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc12b1de650e37206df9b1ba73589d6e765d58b61fae6543e49566dfef4ad28 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a8652a77eae77db7317344a39300f1c0d01e56 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ea055a02388a9dde9bf35f79225a3ee90235e80c65392a49c8d9e50882ac42 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05ea11210bf6917d9e3774fc0ba59a980c0452a8 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a0b1feafa7a50bc0d5475dcbd750265c2b0344cb5e564b9f9c3a67b2255f49e +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08d094d146e80e5f79b72fa690eaafb399d480d6 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17924584e91ea6b161f5cf5429d9965f7a604463fd7036caaf0ef896fd77883d +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2358336419f5ab2bc4f122a0e084cabc8ef3f97 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f36d8c1c36f90e544d33726fa512ae78b093041429623d3201d51080abf9564 +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0e97fa63fa0ccd4ceb84359f813105d6482074c --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c92aca621d3e66a4124415074781616a5d6ae88fdea5427b3021aff66ce095b6 +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36328fdd084ae85da62a9bd0844150be7caa8245 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8dee279e75236b274179831cbf9e3725d0e08833dd8fd1b837942b6f5ef9f9e +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49caa77b744338e12d0b9406552f6a3fda01c2c0 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f1184e4e26e733c59bab9309ffa3f690084d508fb2bbdb5970e2c6a334fb7ba +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21718acef3ba49f094c7714a5e74a41b2622dabd --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d86ff620b5de0d0b92c9e1d18f81d6f441ff9ea70e7db29d366be1dc561ef217 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55534b06d06ae8989047d38378f161d56077588e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bd149142048efdbc590cfd7bbaacc2639a9dfb1338f91ff99d37958ed279192 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1842e04c1578f774bce79af0b7ffadbdc3f4eabe --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b12aeeb5e06728e8312dde1aaae0ffe4cff2754a3b9a5fb41785aeb43e04e10e +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0508e9838fd5e37e367ca6034603078ea599e69b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf3b6934c34382f3450175fdb7a521ec0663e3188ad384b9b229484bd381712d +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2835b69839f54e1c491d4b592efebf72dc7962ba --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e48d7e2d1fa61b35a837af17f24969b1ab3f96e7edd1cc55f91bea3eb0f200b +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d29b3867136303f7e3f8dc97c2be7f326738e43 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dfc0d81ca10ab564645d067bb0ce838ace258bb8ecd868acaf9bae3b9c9795c +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac15310c1e57101b80ddb094660163aa14308954 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89bdb9f5bd71e55f6a678cc47308d6bcc0afff2ed90cbf2033d42769c0f27cb0 +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc83fc8324546a238bb684c2ca7539845c54a6cb --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c78c22692f5611dff8cbcabca4563dfa097f5dc591baf563d8c378029fccf02b +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0fce3afdd5e6ec23f6ad22fbd7f9ee30a8cdfc0 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1ca40c93412a0ad9932e65b354f6b8f22f216c1ecfb184b8483cb84cc130a05 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc08f065f845697a5f1925a200062f5173a704f9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11f00d74ffa8842c09b04f9e5ec2940b2452c14523aac750c3546843940df2f +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f90fa2c5c19b2b95cd5d5659ab84b8633cd981c7 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c547e2f765411fc8361b1af2024078742114c0e6049e5ad8315fdfea1f79a56 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..672414e13dc5d366d1908e3d2ea3279938861a67 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f76b4f8e33dc303fddb61a8387fdd485e2cf95e6209e052c5a10bd267b28f5 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18903bbdb73bd60cd3d9c1a24fad6498934d7ed9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ccdc407d1d33d795587641185291ab8194ef82a10252f2522c9347a339c59af +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b8337ed94e96212e5e2555b496c02b4f425663a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf5c9598aba6c003d9d4780dbff91d69cb5320285945a1e8b89fbc9c7730e86 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2eea31f1149d8d4aed88d56bdfca1ff82d49a3e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed0d9b40fa4393a6bed6febd67b23b34d2ca2b470067616f9d92ed7845444c5 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b8719d74ae50563767018a33269ac46c3902b1b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27a76a17484357874413d948712ac20932aef2de06315a2b979538a7be31f4e0 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6c9793747119196434eb2fb4371ea1faf84fc90 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9513f194a2246a8b21f88227a021ffca58a403505c04e8eb8281fc3776e574c +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c57014267d22f984b80a4852c60ba9a561eef50a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f030c00ebadfb0137a1bc5935f564046f42eea5f7472e9b8e5858fa411f4566 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cbe7ad005cc3e48cd2303e39ccd9f1efb71d639 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:521ae99bcac64b94bada410479ee46d31ef192af6cb0a3537bfc94138a488199 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af28ed3bb60c2b829b8341ca72b416492a2ae456 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3394933882257fdec711e8901a43fe1039a5bd75354eb4054aea734cf0d03136 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..deb0d3b5063b86f805c7b079923bf7efae18d098 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c34305cfffa70f7d10c4f6f591d994c9427a1ac8cc02dbb37db7de09375d66d +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..250f72bd0a491f8b95b0f2fa8cff607e2539e412 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a399e98c3158803a9b307426020cec9c6ab87ba21e981924e67a234924473719 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec635dbc80c2bab7f3539d08aefb0283a649243f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fed93e9d3623058a71cd8bbaf801577c0f337f2293857b6a8f898b4f0770ec1 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95b2479154a5bc7ade8a7d769c249cb6da0af96f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:581f402ebc8ca834638d03dc7266eb555692da33aab096e086218fc5da1ccddf +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e82aff95859566e79ab9207f9251a51418abeda --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf106447d0fecc1a872fd1576af79545018bebc13e0bb8486b91986f53fc2c1d +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5df2885b7d51aad908c9aa928cfc41463d1ed9b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd8911f5bc7600c4049fdabd82b708beed9974f7c504c4d3f1a90b84efc713eb +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4ff929586e828c80305108702fb86217a94ca5d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea0de94d8377d96e945dee9bd623993608d39a3b0ba556e61d8c46e89406106d +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce637455706d6973a657fbdc9d70a9e807d04874 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fe9e260b179a0825352466630cff0f3a22937d55815d0ec7d68ce9988d7c10e +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3abc11f1a9b0bba64177654ee9878362fa13bf6f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58cd4885cd272101306bf67029d8cbb5c91cbea1a927df7846cb0e2afd33429d +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3e0c76be385c5d43a63cc602f29ebf416235a09 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57bcbae6a36b21ebae42e58491fd49b5440c4091856bae1c07c6471320419831 +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8149de219cf7a101c1df56a92165e8e2935243b7 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93b0ccd91d4d23f9ed00a3ff6a9bb7f9a3df0aa47bcae6ddb5395515cf5c6d30 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb6bfb92850cff03a132e63cee8ee082ab3b3f68 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b64dd15224fcc30ac4064e25685f5b378b5d6ff2fd6a152fc7bfa112095499a8 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb608ba71978947de5ed54fd0fcccdefcd5715f5 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e9b7b420461625b0d40e5c88937cc36f7bf113b29cdfdee28f9baaeb732461 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34a646f3e7d6feb6412b284bc77d5d74461c6f04 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e99e8496d28f6e23dd2c8844061eed1cd597b1f66ef2c3d2f4f921b9e7c8504 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eb0bd751f1ea2304c37ad0d98948654465fc6ec --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e97d21d72082739739b2c532dba7d5a677d1cdc5804b61e5887f6435d86da9e +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3fbd93ea41f76973dc72f6e98fd41af9dcf153b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda04698c4f8715339739ccd8c4c2cfce592cbb67eb6f47ddf9e804e21a23c0e +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fcb238c3f2ed90e7aca8c7fbcacd565484368e5 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e58b07f879d257b7f954b20d8b297a5dbefa3b4d94569e233f6135716d7041 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6ffd6932aba27797e88d62cc1f20df093f04bde --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4648000bbb81d995fcbeeb1b0d739c3c16edc00048d3ddf9a5e8cb478c94e471 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c337cfd5c7c5135667bdbd82c66c6a5090fad8e0 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a0a333a45ec3d43f0efcd9e152657696cf16d27d0e72271e8e9cb194ba6c2fc +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2a044342f2292697352d95ce5c088e07ee3314a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c24ac4f5fc976c458415c0186d9734afbe95f4b6e7b16441dc47ada633d3c41 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f16d6b76cf8b58b2c2f6cd1525d1d846de8afe84 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4658a6bc46090f5af9fe703885d1b6ef5bf4d8fbfc9d55d564f813a92717805 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39861382f3091de272aaf4638d644a665adc892f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d34d1cd6617c3a6f10568496b80539bdbfda0bc20e7242779a64966665144f04 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebc403c1ce66afc823bfc83445baafb77009ebe1 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ca5e0c28c0cd570908b3069f1c0e0cb79bfe5df635dfd813a0bcd2f40f2b31 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d5f430d34ca964fb984435ef5dc5fc684876425 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aefc6d93f615ed070654ca88439a54e36690e55ee8c27cb6dd50f0d41102796 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3403cccbcf3b0665fcf289d1da68f95ab82f2200 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cbf2d86c79b106ae1b75f57b32ce2071c5d7112a5e70f7bfe5caf7011c678a9 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae756109bf33f28782d1076e5cbcff29d6b93675 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41d144711aad637bbbe5a6c8cb8cb3aa9b0c2aad598699dd658acabfc6c5efb2 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7005c10c856c7efb76cf64e413112d1e22ce546b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc425af8bf99d256f683680ba4337dfe1259f2d7e9163ee516f169421df90145 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1721521874d9ccf7a43e0cc22524224c9c85af6b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd8faf74fd2cf98bb22c03d17f82d7ef3d0258c5a3178c19a6d73c71ec161e40 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f7e5a92b37e67b9e520f3ac12e0e0b61f49ff61 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a792ec332ed54056913405b106411d8bec4cd57bc95c576d70d3812b600439a5 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cf3aa541945e4e9eb0e966015b2aae63466bc3f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236c71c893f50577f673ca51a95a309914775ffb1571b3dc8105102a45a155cd +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a250f3cdbb03ee0722a9fa65b85959f01e4504ad --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126de4966658428cdb34d95689e5d26b0055f4c9e78a209bcb02a2312abb0318 +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b1f5380f03df817a77fea3f50f1e6050e2198e2 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca25b9f313196ccbb4835b80fb99b4181c61a6129a3d8151bdda8cc84566f3d7 +size 199058647 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83a473332071e7ace596ecffc65b8f2cd75671b2 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3d5fb158ef3a03924ec45305b704bc39296b7a648a99a3eb12d8cad230e09b0 +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93c958dc251406ad3c7bb2e5e4c16bc00d965bb6 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:706e8265d94bb13cda06b15ff5aa6be705ca42b953f140a14a00786d62b22687 +size 199058850 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f950b053daa705b8b0cbea7dc02cf2646028f32d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7417aaceab2bb27be0b5c3fdeb27fa72be736faf17203119ce86daefbb0b760 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa13daa4772d92d08a38cde5805d252392a3ba9f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37235f002e211fe2183ee63bcf13413482a28056c77205464f47a99080441558 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad44525c72f4206b04fb87ade0b55b42dca3bbea --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d4239bea06f8b9c283becfe5e9e887c84cc8d9b53b64d48cd7c3b3e36f4490 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70db2198c576eede6555c52c18fd0f3f01a5c58d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ff5b0df734c0011349331bc006055566926e184ed472aae596fa897b760ea7 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..246ca39d668ed9b813b1afb533af1a1ce0c71623 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9c8692b572b10e1de7f0fef9cf61368a38fd7574d7c580e561f7459416eab31 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4d41712d954af402bd0fe16b49ee8c553e6f526 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56588e4b15807eea397fe72e3949ac263ae3259561dea35c0a6bad63840c5d4 +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a403d3966dfb5401e9e91f843fe00461cf7f365f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0bab3dcacaa52f17fdbe64553c51bde7707ab2413d46d4da8e0f9447b3041a7 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dd5cb89760cb9c2fe5f24797e3836f4fe53b126 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a04e4fefd48ef48eaab7ab592593846e7b80f8d56ad27c53a06b814be9e92ebb +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55e0eeb37a350abc3d08ce13f0da2e4386a6521b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e7ea10142982cc692898bb226caa761fa603cc4cfe960130c38075178cdd072 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1581ce978865b0d17777923c41fe24a0b127391d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01523a9b2303e6cfe0bc19d1557f688b536f165e4852a8233859c92e18cfb8d4 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2632533ac078bd86a32fddaf6e252dce6944dc9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2067cee0a978fba5f82eca0bdd0ed24680422f4387b9a4fa1c015f3c7b0f024a +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acf3110e88e918bf9ef82148e66d4f0bff6aba8f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd57424e751ee4e7e4756648f944a207f5b60d033997a1a2e90c65e5acf78f68 +size 199058722 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30bec1c0ef31c88f3ad7441cda12c22b46116e49 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a5723b221e51777c75ee9153e4bade6de93856fa15d840155552513987d9e3d +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37b56c67b5dcdc6559a3a10f9790a1aa89b13525 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:305a93ba6c76e3239e9f838e630c80a2f1feace0b41980ae062274632521ec5b +size 199058786 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bae3121e90aefc260ddd8ba003eee5221cf7d2b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:947399dadc930168e9ace33309515db96772882e8f24a58769db9a3cc5fc99bc +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..393948ec38adb5bc283e11913387b2e12729afe6 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4db256f90472344c4a2672839557dfb53d45d4332e1ece90d178ffcbae961700 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac3c3e88f1636ad5e3b82890b682cc70e6a7c171 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9388b54eb83cbe0248a42c0fa9daf7e547b9c7894c565c7045990789c0b815db +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bbb8e6a34b7a23a6fcaead67f3516da345cec2d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba19ec14b2f874ae5784b627727c2d68ae79f2bcc1368b31478e68c49445f767 +size 199058658 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cb8db65fd8580af1ba031d755bc52055d41e251 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26c6f7092d53b0c0ab7ae3b4296b09d7f0f63d1e43e1942af1b912d47ca6e548 +size 199058839 diff --git a/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f430320b84b68a0903adde88851805c0703bf2 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:389da4375c391f6ca2d32195c6197eb4969895c4ea5d41282af4c05c32e3c4ea +size 199058839 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_01-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d17d9cc3d0e9fff9c3e81fdb47c7698cf70b9871 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dd842a28b41354a4eb3dc094b4356f02fd724a2195ce91c32b745fc07c08a30 +size 167511299 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_01-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..feae16572706d52faaac61a6f7e3bc13eedd52be --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41ac307a94a9103d4aa0fb37bd463bec341afe0de00258ba51d9c3041ba8e2df +size 167511299 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_03-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4552a0c158af8313bdab7b622e1496600a043dd4 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc3236f1e0f5fd9f4a0a8c1c05fa3ff1e03761f7ef2e646a8e1fddda0ff0670d +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_03-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ef1ea94442ecd60e573e792b3065fe1203ed4f6 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d076f308c2309c72bb2615be7d19f0d18c524a7e3d9f7cff8c45877f4013b806 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_04-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a2948b914e1375fea74ea385afe0a4bceb3401e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f07b5735371fa81a7f497253c2d3a6c1edd2b312f63712768f1f71eabe21816 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_04-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dc1dbee52835e2ebdc9cedbae8f5f83c2d3b515 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1270970a980d16bb280af6f07e615acf8ece1fe2c98af06e84b44d2a9f5097d6 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_05-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bff12b08531a79da140881f79f348e2b1155af4e --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7fcd836d5f250ffb2b799c55f72c4de55d98ad2ffebfece33add02613ef64b +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_05-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a50f2de539d0b81f7e46786efa196799d1131b01 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1876e418f370e55bdf1270632fa9093bfd44b0e2aee8562b839a540c25081223 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_06-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfd0191605754d36d56f6e5bf1fa40a0a7de96d1 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5de7aeab0ee10a43a6ecd85ef2937b9edce3119c4faccd3d90a92be9194dde3 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_06-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffd8cab03c4f9901c000d512c4841081fc38a566 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6301cae56427a3b2f919bb17d8b3b62ee2319a62324acb83889c364005418bbe +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_07-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6385be766b3e8375be8a24ba4dc26092e3065e3 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8de18ac7e8eeb13fe5c267b6bf615c4a4cd14c8f5eed14d8e87c25629f9505f +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_07-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09995f099b82a38387a347c430f1e065af016a2b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffddc60818ec9e70cff4106b93c6e971daf802fae4334a6515fed832f776ccfc +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_08-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9803804e1e9b5b2d594c32cb313c97f8a057748 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:249731b3613ccdf3d7a1df27545f23fe0c825b3abb593658c32823964a1ec717 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_08-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa268f4653bb866079d15cea3ebc35f4760f7c22 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:814f60e2c1223b439b9d4cf9b705d9a68068b747bd051484bda009980bef663a +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_09-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d3daa021176b8cc01e30a9ccbdd171cad336dc4 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a62834a4d6f2f836d5e239af818296d7f68fa81af42c6c7d1bf3e5efb38cda1 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_09-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff96410463aabc150f566e6b6bb620ea715bab40 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5e80df19839c9c517aea39471350721575f9afca5ec9a7b5bb566f9f88f0299 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_10-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f61603edf0eabe142a19ca9faeea819963acda3b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17637440aad2b66d75660b52932a69d9fd5b7102fd673f950844e30933ea2433 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_10-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e18818dce1dd1182a6ea3d7ceb07da25f2041dad --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0de5ffa28196f8ade990d346a4073ae12d2be1723a25842369eb1e06cd0f02 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_11-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aa77566e661c08f2425882fae86fc296179ebf8 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a7023230a5a7e2a9e949f291225de2f4a60c23cdcfc2a5eca5eeb6ce90eb660 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_11-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c277e5774d263c4704205994bfb5ac683dd554e6 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d128eb5398db6f5271a8b64309b49b74f2a5b209a9850a5ba7b72ee149eb4d2 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_12-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bdb6eefe4501bae5ffb5b547566d671a737ba75 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b6b2ce274b01f755a9e42c8b271c93edb866ff7758687645731ae256a0092b +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_12-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7feea96fff333fb1034262f3769302d12da2265 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e9524637e21b0244bba2733d0a98f31d1fc4f0d9dcf23f5e235784d1d90dbb +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_13-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..585a26c0674cbb8d1e7159753a84777e3d02c38c --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df40e30c2a7d6e3fcb0d00fffa32707a9f284fd9982acf609d123981ea6aa073 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_13-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e74060f88dc0e582597c3cbabef9b0991cc91a8 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10bc99cab28196ca139c0d0067caa2980746a18ea62520343675e9630fd44cbb +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_14-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8364049d4a1ec4d856dc296d9a66a4665d53d733 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84bf5dc49b706f309e840a937ccd231ee7b5bd0f0123654faa198db5bdfb8083 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_14-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f85e1ebcdc742759b3efa005a1add02c114f3ec2 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3245664d30db74f5980740f7d59d060d2602846a655ab8f30a7be80cf2d2fa +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_15-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64d9858d9f7972f120bc5ea5912dc3aef5af2166 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:870bd452afd72b437ab028a7f32b7e1918acde97be9cd85114fc3a264d2c509b +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_15-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a32b8b69b55f0def3f2c4a3a2cb9d8e81f8e3036 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0719830440f802207ee684ed8432108c7a7d79aac47f1975d1629a8469b2e239 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_16-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c586cdfbda05fa38dcb887e71fd2ab05306957b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21285576dd55088395b94d0d4ce92430e57fa445ba18349c94e419dafb3411e0 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_16-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7ef75801c92004104510cf7556c4e02e0c3b2e1 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:724686fce5c9a2d67597a59e7c6f62f3d7a02c49f03f5b1184f36ad62c095e40 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_17-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7443a68932600118227b5e90f32edaddbe7ebf40 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed549f8e2cea6371a3c495ca010e1e19cdb48a33ebe2cfbf798932b2106dee32 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_17-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb56d3b6592b3447215f3b4433b90adeb12147fd --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c068b56eeeaf4e1f12bd97a3c67caffbc1a600ba384f9451c8439cb77c686c40 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_18-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aab391528b19700e4fc76c029fabb6b73289a05 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfe94466ee6967d1205584e9d9d4cfc168da6dd594e56752f7ecded14e3a63fb +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_18-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62d986bf5aeb2875d09117b0799ff528ce8baf4b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3addc8e2e66222cf18992a35ed6a68c2a34e999eae83df857014442faf855775 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_19-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecfb45ab604db93401b9237ef9d5c7257028c81a --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177d40a24155ba51ac9f1f623fab7ef660ace3f3d153c121a89557182a0b04c5 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_19-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..056c4a2145e4e19a281c9724840ec2ac0ec68aa7 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12314a9f3b14caa0116d6d5d74f95dabe15f72c79ec0ed495a802d3bcadeb5d +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_20-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04b2b08fef778e967619f353c2ba58201448cd57 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d52f3e4e7b3e7a7a7a06c3b046d5813ef04a5af12a297ad8b0428220873464ee +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_20-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a60dd52a48e48e20e63dfa9080b0c3d908ad480 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033b1dab5ed3d68984c072e74d7c745bec57de95e5e8ac0b9218bf5d7e2e54cf +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_21-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1054d8b1a004a830fbc61ff3f9f4a0e9de5b05f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc2228f5f3c96833fd102776afb1d9504b674ee41462535f5f87b6f4e003b220 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_21-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..848f957f3a9ffc5c82e51f586a7c23eba1f3cff4 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:276aae3b9e17736240bca941a5ca1ecfc1bd2b7e425eddb70603ae5234dd0fe6 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_22-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e676a92e52a43b2b3fa50344d1d9f72e7e298b8 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3567acb0e3eb86ac11c7783647c92a88de52abfe647f3122aa67d54b6936688 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_22-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0a6e399e92b2c947cacd3eb342026392fbe60cc --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f490a24a8bbe718b1f6084a3746e46446f8ad50b1999aa3d35767140207d71ec +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_23-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..542d42ec7534381190f4139c92e2c79724818233 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4bedf59327a391811b675e736233183460247409f2566ae64e00a54bdc074d3 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_23-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75c664bc3106ccb061617baca2393892a3710555 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b50942c556764a4a9cf7d3bfddd6cfc2727995feb1f7dff24d704863d15ab3f9 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_24-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e645b0ce2f5f8eab15a96d223e1b193a73987a7b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9da4e0ae6a8efad9d56fdb65b4c954b0132ba62f0e01de1f50490ad39e9078b8 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_24-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..290cd4dab13c26c9b910a20720ef1f100a6b44a4 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe2d3a185713f157bb04554557aedd4e3c3d0404a393b028f74c6de447a2e591 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_25-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbd6dd18c38e2e5a2e44f1c6f3ce66c8dd52b80c --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1be23a4da9dd17f1e2d6e276aaa60183336a85eb13f48e545ca91099677131c +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_25-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..658779e223e3b7985725d4fa1eb7f2ffe093e47b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c0f7324176a1ede98091ecfee158a24a19ac5a88c1aac3562592a61d14a1fe4 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_26-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e62e3c214063bc82d78b0578a19b457a6a7168a7 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f88ecf810880d381022ddf3aa8c650fbf7d40523259a6910747aba4f8e3dbaab +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_26-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94982b515165d94d6b1d616142145fd5b6aba262 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:accc941597a329a706fe5c6332a49c9b14fbb06f5ddd29943a4bc47816c9df9f +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_27-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..465c484150c8f614cc56a46ad45de69c10926ced --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12abf3701b00aaf6cfdd9428b19884058fc2366cf13c11d73d893c433d034c48 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_27-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28971c4298b2be369910a8dc82d0fb1c33d1b7f2 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bad2a1184f3949293129a518ea69e2c45bfc28835c4a747122bd0c36de8cb250 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_28-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df0fd60de94bdab3c6fd6bb02d0d026319fdee8d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:107df66d3f19ebde5fdbf3b4513be557080ae734261ecbeb072a348f6e1c1ca7 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_28-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91b22e54ca49a5af2f4a08efbb8ad2237267861c --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b7719c932163c34c9172ca8a638415bfea02810264da2a1d79c7f7e13cf4781 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_29-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..792d92ef971e1bd9afcb5a0db06660d565f3ced9 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee8e1ad54be7440e6ca878e7653099277c8b941c2597eaf73a76c44ae5d8cbe +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_29-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d05f097415a88e81fa5ef7e17771561e6af59812 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4237025f894ecf118f8e62bd1de32325d9e6c2297666ae8762dabc378e370b2 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_30-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..486f3fa64a43d3e85a453b3b254c44bac308fd3d --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d6f725f440cb58be65d9b8399e7831fe190f01547ae3630c139e60bf51b6290 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_30-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..372873f77460be9ea2147f0cc2372eaa3de24b17 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da3029cc2e6d3a6be5eaa75a2ab6d7ddf0f32f61dc1404a4fe3c629274c99cd8 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_31-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdc4c08e7dc55f2f32b31cad48f6670105146424 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1a5ce98805661fd68da3e7b343a1ae3b1e136a4094a8e4197f015b20d8bb7b +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_31-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a0cd7f3bbb9f87889d13062ad88f0f0f6543888 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddc5dbc4f0fc2154316d7f60d301239cd1279fd8124c78d141eaa184df03060a +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_32-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8865631a55c31904d36ef27bedda4655bfa23eb6 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89a3b3b0d74408648e8651e1ae11ccbdb69959f3587f86bb697a689282d78d83 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_32-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c502666d1f862443d3be6d69f5babed22814a177 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e312aad5e1e65f71a16e9872b3e7ad5e82dbdacbee72278be1981dbb6731fc6 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_33-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..018848199b8172b1db88d10a84c84d4df1613823 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea0df4cc8b08298425246d0b76da9cb69d2e3958b726d3d0603b60aaa36a53d +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_33-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57a518f2eb7217fda7e5897fa4cb6f65c0cf016c --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceab9d6199575ffd847bb1ec61e3b34d1e79c5ccf815a8125ce49e1d9226dcdf +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_34-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9288a6dd9930ceeb331cf501b6cdbae95b678210 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b9b2bd9e2234ac270f5f11f7af2365b8daee53335077168659ff40cd02c8881 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_34-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b710099a06f7ad2ef88568039341615848d2db19 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:207ae931f81dd255528c4bc0a8ad7f1255449cdc45a59aa23780d2589b12f35a +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_35-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b8406b2deed8483f9d382ad56582073af0b098 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4012478025d670775f3ca30d627fd25d13dfa3c9fe47e298e429c44bedf22796 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_35-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8550e961bc5460e63bff5d1410c35c5fb02bb1e8 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc7560f611bcca69eb6ade0baf1298420973bfbcfbb74243477f192fb63d162 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_36-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3017bd26ef376a4c8ad427b34cb3763feb1b18e7 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f2695b5c26f23f006e313a318793bad1c814325def7d5b6dd6665c5ea44ed8b +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_36-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1fbcabc80813897bc83c50c513a12d1e8a99ff3 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17d48f31ddb2aa2d637a266dfbec4c8618449aceb3c75be9828f9e3ccb48c56b +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_37-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af2e7216d3ad082bc60b1c2c900a65c8453a931c --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:def484b337569756621492cfe3ff13d349eaf6d2b2cb92366469dcd542282c74 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_37-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7a57d0ade45a4f48cbdcc830d0885a8dcb8942b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaa5f9743c551fdcd7e6eb6f88066395f735d79ef3709b516fc3f6372e403a53 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_38-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf9cde390d35b8e4e0807162285228216caeac95 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6faa5ff080ea4433950a8149008e9fa3cba568d8792473ce2683fd1c2933ec3c +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_38-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f672eedf5b4dc568f8570ea77b51091b63d3dc9f --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dee1b581bdaaf3c1111edb9a1b8f575bf55cec9a6568cb73d5b26183c3e2ba2 +size 113308931 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_40-model_00-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..502048237b32b7ef1661cd9bf6bd95d8821b9c48 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2023b81e931801f90d32b57bcaa3abde1096f0627063a5f5c321188dc47a15b5 +size 13507 diff --git a/4b284b84bc4v2seed1/global_step80108/layer_40-model_01-model_states.pt b/4b284b84bc4v2seed1/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3a6d05d718c29bf0a931809ee27e131d352de7b --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a46a58788d39ec7783bc1425b051526efedeb40260671b241b3533660ebdcae3 +size 13507 diff --git a/4b284b84bc4v2seed1/global_step80108/mp_rank_00_model_states.pt b/4b284b84bc4v2seed1/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56cdeb50d9390344f9c1af647f73f10c6e0dd897 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62e1db898f8dbb1821f5bd3c6a8b5960b0deb8d0bbac08e52047785a5a8b8be3 +size 51507 diff --git a/4b284b84bc4v2seed1/global_step80108/mp_rank_01_model_states.pt b/4b284b84bc4v2seed1/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65942f6ca2e38fefb0a51dd4137f648acaf50d93 --- /dev/null +++ b/4b284b84bc4v2seed1/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86b18743eaa2fb1e8b2c64998f4f7d4c25e24fa82662aa70514f42e42279c3b3 +size 51507 diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0b1162d55090a28e6dd30b90461ca34e4d3f09aa --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4561902687825146, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.045631246828587047}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07625749807589129, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015146545254109735}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3307426476163128, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00456779888031621}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11679844154672582, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019568915949739994}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03608151986203413, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009254470422146193}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.16229717802554836, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032223185692842058}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0554093381893294, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012327294395014525}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07353494344552397, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013741278529976802}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3230730872507571, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004482961394584532}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11311445429105703, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018346474985473178}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07303744482119352, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014379306638165714}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.31705954495780236, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004318803443289957}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11188332112192871, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018465577738166203}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..22ac0b010f33ae7d0f7071558a9ba41bfd9266f2 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5886516458334025, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03717726878870121}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08026566053193719, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014159639116614112}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3942157437513017, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005461079688404384}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12548839335267944, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001928881826547231}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.038000879190334146, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008787103935280456}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19923195745941746, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003907735021234661}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.059755176813484405, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012347079912433854}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07552316506586856, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00123012987736281}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3738994305484677, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005048426209720286}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1183744839063624, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016906391136317978}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07603490019116672, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001311880863082997}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.37313363669466976, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004995079076932912}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11887135903817798, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017838888979302661}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8a6c64dca38c063a25c33b77bac9ab6c1c31ea48 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6600722092729007, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03519197756328506}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07745497341270637, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012346921599162308}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.41190076505770906, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005377825981214025}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1228359376509253, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017091878261403075}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.035903159669296886, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007708405381290396}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20783156644312073, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0039023098470249125}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05732608605259917, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011019893164004922}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07197458828228794, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001092373974273461}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3823575589838747, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004836437439878737}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11414361148332351, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015117695102111128}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07349628109207673, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011632716540392056}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3899929430530594, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004966781612279243}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11649612591713067, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016039234092463776}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..29800da54308a4a898a57e806d444abe65c2ec73 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7938690838487434, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.031249006432413233}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0802242746933909, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012915264518391}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.432425410033066, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005388624217576616}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12765986861457063, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017842279285890702}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03742102127943016, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007953067755003365}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.22000051519312314, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00404703168782795}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.060003612710909315, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001146664477215343}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07327312156062743, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011113752501149396}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.39487814553889183, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004737789640173793}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11660022195969111, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015332520691398934}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07598267078545315, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001204590796246913}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.4089805013247068, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004967802237281888}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12088469182871771, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001661523804555607}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..2a5fba0a9ab9ddf696e69423dbd18de3b04ce598 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8218123055098046, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.044246313732840256}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07753724548278816, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011900746777565759}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4341910857165979, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005446504875155181}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12410661735510435, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001658918514736671}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03630893474019336, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007351259548705939}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2243388369397611, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004106316366094987}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.058623697481614896, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010716614020870505}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07062282112602274, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010428980489891116}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3935550435860648, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004760493217032566}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11289953851936033, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014402500630831217}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07330274436223451, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011220316964088218}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.4085243199495146, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0049771427706643894}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1172028966984663, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001554404781749481}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..03506cea2df3fa466a33901ca33638a194448822 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.913925260231582, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.051763978663194966}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07874146764038398, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012134560937164121}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.45109520601285813, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005553088446218645}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12641834793897835, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016320788274985598}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03656608773889105, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000760846094550187}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.23230496648757598, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004227400481066823}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05915409533137278, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010512753815705362}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07104014696908037, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010444495191682013}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.40599373509139014, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00482831666482983}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11387146771889235, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013950097533787038}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07423831821118593, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011248214939780865}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.424873549364599, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005112245054065837}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11913823061282955, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015199756969136377}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b43ed10f40ae87b6e1336586750a41f5c38be5cf --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1490543596959789, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019546229536216812}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.25389546448233424, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002741124482183061}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1745670903777373, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019234371005345781}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03016441545474279, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007719528814370501}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.053419440384246994, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014288658559341756}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03547451018256482, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008627729378350705}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11627822506127969, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013862347099417346}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.2054884045718469, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002244877757105672}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13785667531218, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013936984378312576}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13663769110467477, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017798375104242446}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23440517613484713, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025460475763855804}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16028302243607997, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017474929334903653}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.6235229126061184, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07158856142385593}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..bb203bf9150f4c882e9695d23f4be6d56fc36638 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.22331912988940492, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0027687942933625823}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.3105879084943194, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029250201802578303}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22808328022499394, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020320515676967767}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.06014163619235408, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001549861456149217}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08133586965727622, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017304100412085226}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05894457560206053, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001148762569744268}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.16233563631626566, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0021600975326785993}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22817247618168887, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023092419967920526}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.16440728290895265, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001417667346489937}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.2095322539144404, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002623522761491815}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.29186247430489015, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027828596792989963}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.2138081154409409, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019073843040340796}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.148014517976192, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08632853762954663}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4f08f418ceec2981ccb979d1a184e3fa12af7dfd --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.25284242615549224, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003346416305554945}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2985206799819407, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002872417745008737}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.23269927040845031, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020394436744448855}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.07352861081692932, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001975577012025009}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08045188272326337, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001687564851802267}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.06308783765355935, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012452038663643937}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.18896530779163317, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027402813839447243}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22165381331302203, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022793478208025125}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1711468063140619, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015216107571068406}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.23906918273035027, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003206715750850772}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2821026125213223, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027371552638994733}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.2196667775453629, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019303318209296886}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.648405351452855, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12713119304572523}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..397f5a83b5f3aed3160cbe5191bba717590df071 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.21412240705416308, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003573906850229763}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2363591035613763, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032427476384113535}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18860588124930222, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002411594336470169}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0620187002238152, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001908345830156357}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0644931653305227, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001637056221909264}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.051285956226699604, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012327125521204533}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1623855639995828, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002892414171534976}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.17796581661301386, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025623361467453773}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14052920532911936, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018198320452371584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.20310628745671855, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0034230022998127862}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22379283876686262, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030762140186834028}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17844826504839648, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022785596409348953}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.6829199554261502, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08848427999980182}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9ee5944bfc9ee3d66389270d079da05d6bfc4011 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.06596988964164227, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026452643433214004}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07786694962495821, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002793778795842796}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.058680633472697495, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020527112852523396}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.018662630886825272, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011852493101770921}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.021659652341736273, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011776028400838929}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.015912520231271727, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008257625671288616}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.05090308576277237, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002121767282678217}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.05971715204113024, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002201135080103992}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04448068031172814, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015668077231183733}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.06266723632734954, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002537275263785622}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.07362961134314913, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026439669964067034}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.055493537558428035, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001944192579335498}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.4977010788321425, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.029197504340406147}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f4adb3e7423c3e2c5556571f8a4d749ea9d08957 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.009347302370204104, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009939432842913038}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.012675375103590819, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0012741296212300682}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009019405424799239, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008796953070286968}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.002520125545331128, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00043890835709493897}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0034745962063106794, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004926837590871648}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002459973367560091, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0003520874137724776}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.007379431863883617, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0008249510021821957}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.009772980431375072, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009978936334822926}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006955043299953472, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006891726751168752}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.008880786469979814, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0009541098770127502}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.011981285756158963, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012073677632838248}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008527269899079934, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008337482953004597}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 8.62147070684518e-08, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.4998412186774315e-07}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..58ca6bbdae608c3290fc618d5c768bbc06348a57 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 2.5190605487649087, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14578061564278902}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.12015610790826121, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026013907575401264}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.1007142822326354, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025699976738232087}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.08785204369989494, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001909841985405621}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.021978597704618782, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011061787510217053}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.026856846878022297, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012249926502431994}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.020631873410295806, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008986868448192905}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.11432207717597319, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002375152014750786}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.09673002538661275, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024476967854968764}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.083870708743602, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017764834490443292}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.10920558363229785, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023563322630614446}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.08646567425286227, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0022239273238183668}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.0771386142988915, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016644247241633418}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9f39b05d2358978b8b016f2232dec615f0f67077 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.471305506037798, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07875003513092577}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5170379371586666, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0033287522955400954}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4239211672299534, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002947218737469124}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.43708472576518986, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00224171007536442}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.24177763061210847, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026337382842525014}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1931046855790191, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020767023449716755}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19998119743920914, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019048339787913725}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3792838934227107, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002982844793468976}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3062355213393646, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023427585826778815}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.31725506977900303, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019449957706219145}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.42712804511272506, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003164747958067866}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3486090540172501, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002679539945997737}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3599294935860651, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021823306634720274}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..58acbbb89445b04430ebbae080e1f068a199f955 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.980968022690044, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.21821573679070036}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5445902709342957, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00337974740434529}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.458944313155064, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029017981497803163}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.47004796009089583, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022258968023120985}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2713453392654981, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002780199873202826}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2245350505416365, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022393722057462194}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23012493273504447, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002033859795223151}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4018381948627221, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030321901639654486}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33679603771757866, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002478135715528108}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34524196268248847, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020571216808165926}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.45423494017342136, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003233814196249404}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3829304393507027, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027623882797974796}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39203827558400783, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022732280818521912}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ebba357c158118ea10fdd6baa153179ce4270d5c --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.154980307761505, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1448658074579454}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5290233700279933, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003286733532241089}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4695155836113227, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028589858065198362}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4705643512917158, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00214940659696796}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.265538771393177, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026553555632510255}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23270443394551238, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022448787273333173}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23283631982568367, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019771157251113228}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.39229315419704086, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029631232557498915}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3458978765243631, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024472277771961978}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3471376353301056, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020102129845005895}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.44487893090959907, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003164337474810978}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39451585686809876, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002730627600611841}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3954525442177938, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022179179708118656}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..183e3e19b0d9869b35d8fa138ac8f8e2c1d64f19 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.721038666752582, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17683442815246456}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5089881039212353, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031941598167466606}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.479032657967036, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002765675705775823}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4691628743032071, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002144459294602491}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2551097554402564, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002576496565725004}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23713242535420967, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00222316717149407}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23219088772710936, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001982880603357365}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.37390882033029804, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028070940255931595}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3512215949214737, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024022657027433863}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3437342989792434, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019737589675455874}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4277340821604659, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003042188683426346}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40285522466618634, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026869688850980986}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39438992601573425, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022083897072610196}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e6d65af35c4cdcd178d3849f3a647b0f4f2c710c --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.685692148533645, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18475778017537345}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.508438587476658, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030967236462497586}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4814718095446795, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002740769966051787}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4719066444266488, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021232213144874593}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2543070392775442, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025002270899075695}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2386513703857796, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022344362770068673}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2335596273503415, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019811310308482434}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3699950720656377, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0026651187832523664}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35074320852708746, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002429104142195895}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34320081095568616, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001977144393265691}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.427080652482253, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002971111279966823}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40443782365098674, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026631012930175323}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3963766746924401, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00219952367965179}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9f58f181cb1eef26957f47addf93e0391152dd76 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1675664806545814, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002452603521749886}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.34303659164580813, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00451220621305511}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2155668468544653, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026646559073492822}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03864946281782141, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014769194957715624}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08335808413265051, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002908314864654091}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05045080374949566, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017576960885745984}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12702750275933555, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001968823066408308}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.26154017483908965, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003585895961808971}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1635478469839484, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021077578920492917}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.13051144332858214, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020713501923767027}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26981706823174656, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003957679243103724}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16836751227813998, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022998758409405514}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.160170846637464, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09889873775096984}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..dbf376fe83b5c3601c790494fec59d8d59362b36 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13520973640137626, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001930299351096568}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3323577264719374, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004491568598510519}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1898050764365515, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025895313777244354}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03140636068492149, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001113870373266841}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08109440867971819, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0029471809124174825}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04465858992847766, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015759770915751918}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10636283963297354, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014233454751993193}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.26423746064810627, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003579439421960654}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14968873061397606, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001933469116399493}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10653719114272985, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015634601753452939}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26451619174803076, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003902068769045215}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14993016736293346, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021358853384488446}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.8701953699144762, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05457096063405516}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..0df6e990dfd9b91ece87489af979ac4aec8be9e9 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1369596940677527, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018924121735394107}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.33267847518896543, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004382896639279902}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1913140581117672, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025051242733995895}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03283865595587313, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011141105617716379}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08404626501275646, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0029766014928721417}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.046514407795467595, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015752063358252097}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.11105944816976555, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014582290975397828}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.27226184993618935, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003638521351468343}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1555172607724421, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019665304832963766}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10559932998246374, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015493840715498106}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2597115453851503, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003887704936356228}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.148021529852108, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021093930620772303}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.8292996100546781, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08163094513619551}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..69015630de908bb4deb349ceee3d88141adcbf53 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13421303891622097, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021412802231387967}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.310980261970668, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004684135200277263}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1828325966117306, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026884744365811403}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03176375904264973, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011285744197009628}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0771291588842163, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0028009360577460445}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.043981143624385655, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015389553455476062}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.11010971775440595, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017060839433245796}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.257265478142769, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003940518987777604}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.15042887440453737, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002182144987791837}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10364375570761218, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017533516458810485}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24201646695848927, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004005217279812412}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14143730410765654, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022370123860963476}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.729714249041032, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09968587223572584}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..976676bdec19b00163c05e626210eec07ce7ecdf --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.04440086644350133, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0028076146832161425}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0803342918035357, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004572536216376621}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0521003876015691, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002910995728301919}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.011721386490746217, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001394908515617324}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.020621720002167342, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017793611110912008}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.01307647569779615, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011218803952754701}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03669834695042482, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0023530729136330853}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.06682107529885967, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0038307757001802474}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.04296796327738306, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002392166194141485}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.03617640134116618, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023748208613590294}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.06502829732266231, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003786163884263381}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.042028608773829565, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023859608992589927}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.9890184534659001, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14163039170125274}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..66fad039c478c8412c2ce0139c4836c6764a7e85 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/agg.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.003536517824005411, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010348361693354221}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0026502867716370814, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0007219200372674768}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002975946933660433, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008325096950346747}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0007216185282223018, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00028726019405366274}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00047841047841047846, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00018648358251820024}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0005678964868499288, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00022071683514847003}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0027483075773717747, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0008030756319798513}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0021047616766507017, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0005731278953348982}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.002335136000302258, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.000650477644840957}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0029063810983753734, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008739925650642316}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0021888663476128875, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0006063079941836999}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0024473347701190456, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0006984333555662036}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3300633595706627e-37, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.704529748702706e-32}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a5b00fe26ecb4ab4011b041bb9b23a8b819d1b87 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d9198ee8c081fd9bdb570fa4b79f13b97318d926aab0405d9aadd5bc479f461 +size 4121966 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c7199201e3af842c15cafa8d6f859b916e876877 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d114c788acfb9bd66c8fb2544f114aa0645e302c45ec3f645d9c491328f0764 +size 5056668 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..34ec7daffceec34b0756b22e334eb145f894da05 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec98038483a009d443f1bf75b4151039f349dc77f944d2cc203d7259ff915024 +size 5999885 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e3c1d8fee6c74a3ee832c2fe4a09dfeaa5c67608 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeafa1658ea3fe1c33ca1088b0b751e569509f624a9d73fbc52a085fa3bb9d67 +size 6928028 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6ded49ce81d3a9fa9c1bece88d3b93a5729dcdf5 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab7852f5e9f3aa4687558737c4a7c92012a826f4d0fcebedf85b04875d3c58e4 +size 7845786 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f1426a8833e655a6bd476d474df5a7306c7c9c07 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed903171fd63f716fe17e450bd00977d3238b5b382980a124c61300cfa01d873 +size 8756079 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4bb1a960cff5ce7ea23502fdb8e1d73e9c9ec2c2 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7179c65e6207fed6a86c2915fe4365e85d4ce798acae22f0ee8c2c7b8bc3d7be +size 7690380 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b48c1aac162b61808d834cfe9f549b9bf5c18b5b --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e2fe3258e8b26192f8ea504e7161d4298d56acd7741e105e18dfabf6d6804e6 +size 13242639 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8627b800130ab99d9a52ea8224918673a74b2779 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e382af6786f73696871e6e3b9ada1c8845ff3f86280c125c13cf749c1dc85855 +size 18793270 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..499ef601d02751328ae3a58dd474c01cdb026d3f --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:340910439bd65c60e0969342c67f3142ee770615d76376589883b389a4ab43ff +size 24211968 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e026fdf504be8e3519a222f7988d06de44831997 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b22fc7c23a42fabb4c1def91d5543826b91318a75052e75924c4f0d55836e173 +size 29436243 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6e7b2d43f4f5f54be69eddf1955157b71dcd03b4 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f8fbde5f8221219858d7d9cb0e1796f99cddab65e72a7fc30d289f369a974d0 +size 34794398 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6b4a3a710887b30d06af34872c76fe6a18f3c988 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78603a29802b1994b4e0f550d426143eec44060041356e4236a5b23e2a7a3a55 +size 3953675 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a20dc8d4ade83f7c889fd13eaeb66c0892ea2ad9 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1460d7702acdc284add41dbd874ded0b54806b2810d32305b6d29a00e509dd50 +size 5049795 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4a294a17f07a8b66c7f0801e94a605442458f6eb --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ea63ba263e4c85c99a00eb6e09ed04ab4d2164667de826eaf84c177f2acd13 +size 6141965 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..31714328eba0195985300558c37e91b6e1cd238c --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:479c619759476751b2f4b97ba0e90e44b14cca98a9bf3b9769190536b82e3651 +size 7245471 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..653b4d1a03e0e1b20c61129ae5b68a843aa297f5 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1740f85fa369914567607fff601cb1d877f4abda1cc0c11bc998b58dbae697f1 +size 8348119 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..31e05ed4506ac6d58312366c799bc64ffc9e40ef --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70efb972f916ac3999f1c4252e347d3a42598ceb9e5cc1004a5c53dd79eab7a6 +size 9435134 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_0.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2d3b045ec867c755d639f487cfb31b4d68198c97 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37861a7c57f19b1a516d7e365b45424f85a226b2987e0f0d0047a834bf59575b +size 2798549 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_1.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..78266d5fbeed3b9aaf0e00f181f7e5e909d49435 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e18e447ed7393c0394f3c16b50b9a370e568295881347477a148a5c1bfa1cfe +size 5105029 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_2.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..df099bcfc89781378e6f315336c3c6a62a890ce0 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e0d9be8d71ccd10482e7e61c1a209de302978c2a5d6b82487eaeea06257e9c +size 7377651 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_3.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f6b003c3d8d112f00cca312bb027c5f69b07a718 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:843e49747c8a627dc70ccf0dbc8f5f9619f8eac8f28cd2a94c56844d307efb1e +size 9646002 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_4.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ff6cdd1636dd1fa5f0ea70640107e664cda02eed --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f95506c602d1d2f92d5d6e59f5cbaf9d3ddc71003c340c2399dd20c1f7e0ea40 +size 11671647 diff --git a/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_5.jsonl b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9f5eedb37058f4caf85d47b422dd1810a7c9007c --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/examples.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef30de121370148502db0cac80d7f8e674a66c022cd9492bf3db02834362403d +size 13897488 diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..202b58b8a7c7f85c98be0d66e87503c096296afa --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4561902687825146, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.045631246828587047 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07625749807589129, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015146545254109735 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3307426476163128, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00456779888031621 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11679844154672582, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019568915949739994 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03608151986203413, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009254470422146193 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.16229717802554836, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032223185692842058 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0554093381893294, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012327294395014525 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07353494344552397, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013741278529976802 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3230730872507571, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004482961394584532 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11311445429105703, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018346474985473178 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07303744482119352, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014379306638165714 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.31705954495780236, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004318803443289957 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11188332112192871, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018465577738166203 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..b991507956dd2eeb9c24c7858a0d2527d7eb9d7d --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5886516458334025, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03717726878870121 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08026566053193719, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014159639116614112 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3942157437513017, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005461079688404384 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12548839335267944, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001928881826547231 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.038000879190334146, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008787103935280456 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19923195745941746, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003907735021234661 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.059755176813484405, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012347079912433854 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07552316506586856, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00123012987736281 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3738994305484677, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005048426209720286 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1183744839063624, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016906391136317978 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07603490019116672, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001311880863082997 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.37313363669466976, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004995079076932912 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11887135903817798, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017838888979302661 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c8c04c37ad88a93a4fb7134954b948e9b4776cb5 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6600722092729007, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03519197756328506 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07745497341270637, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012346921599162308 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.41190076505770906, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005377825981214025 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1228359376509253, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017091878261403075 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.035903159669296886, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007708405381290396 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20783156644312073, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0039023098470249125 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05732608605259917, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011019893164004922 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07197458828228794, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001092373974273461 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3823575589838747, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004836437439878737 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11414361148332351, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015117695102111128 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07349628109207673, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011632716540392056 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3899929430530594, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004966781612279243 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11649612591713067, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016039234092463776 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..fc4412bd97f837bc716453ffd6fbd39f295361b6 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7938690838487434, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.031249006432413233 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0802242746933909, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012915264518391 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.432425410033066, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005388624217576616 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12765986861457063, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017842279285890702 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03742102127943016, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007953067755003365 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.22000051519312314, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00404703168782795 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.060003612710909315, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001146664477215343 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07327312156062743, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011113752501149396 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.39487814553889183, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004737789640173793 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11660022195969111, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015332520691398934 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07598267078545315, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001204590796246913 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.4089805013247068, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004967802237281888 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12088469182871771, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001661523804555607 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..dc36a1dc16f95a642b8801514b3704faf940fa07 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8218123055098046, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.044246313732840256 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07753724548278816, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011900746777565759 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4341910857165979, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005446504875155181 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12410661735510435, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001658918514736671 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03630893474019336, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007351259548705939 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2243388369397611, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004106316366094987 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.058623697481614896, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010716614020870505 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07062282112602274, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010428980489891116 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3935550435860648, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004760493217032566 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11289953851936033, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014402500630831217 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07330274436223451, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011220316964088218 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.4085243199495146, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0049771427706643894 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1172028966984663, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001554404781749481 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b24431ba6a180b24e185f8e25824c791447f0a73 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.913925260231582, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.051763978663194966 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07874146764038398, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012134560937164121 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.45109520601285813, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005553088446218645 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12641834793897835, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016320788274985598 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03656608773889105, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000760846094550187 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.23230496648757598, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004227400481066823 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05915409533137278, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010512753815705362 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07104014696908037, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010444495191682013 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.40599373509139014, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00482831666482983 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11387146771889235, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013950097533787038 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07423831821118593, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011248214939780865 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.424873549364599, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005112245054065837 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11913823061282955, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015199756969136377 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a47f7b841b7bc4e5801ca63babae65447ee6a438 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1490543596959789, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019546229536216812 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.25389546448233424, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002741124482183061 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1745670903777373, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019234371005345781 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03016441545474279, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007719528814370501 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.053419440384246994, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014288658559341756 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03547451018256482, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008627729378350705 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11627822506127969, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013862347099417346 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.2054884045718469, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002244877757105672 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13785667531218, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013936984378312576 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13663769110467477, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017798375104242446 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23440517613484713, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025460475763855804 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16028302243607997, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017474929334903653 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.6235229126061184, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07158856142385593 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6771fd383bf2bd8f69f323243a2fd4a6622ea696 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.22331912988940492, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0027687942933625823 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.3105879084943194, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0029250201802578303 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22808328022499394, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020320515676967767 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.06014163619235408, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001549861456149217 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08133586965727622, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017304100412085226 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05894457560206053, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001148762569744268 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.16233563631626566, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0021600975326785993 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22817247618168887, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0023092419967920526 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.16440728290895265, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001417667346489937 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.2095322539144404, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002623522761491815 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.29186247430489015, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027828596792989963 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.2138081154409409, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019073843040340796 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.148014517976192, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08632853762954663 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..f79a338c4ac7204099789b278278462e2253d26b --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.25284242615549224, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003346416305554945 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2985206799819407, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002872417745008737 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.23269927040845031, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020394436744448855 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.07352861081692932, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001975577012025009 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08045188272326337, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001687564851802267 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.06308783765355935, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012452038663643937 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.18896530779163317, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0027402813839447243 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22165381331302203, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022793478208025125 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1711468063140619, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015216107571068406 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.23906918273035027, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003206715750850772 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2821026125213223, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027371552638994733 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.2196667775453629, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019303318209296886 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.648405351452855, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.12713119304572523 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d903b5fd691e161ff6ed9bda3c4744d4c9581a96 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.21412240705416308, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003573906850229763 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2363591035613763, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032427476384113535 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18860588124930222, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002411594336470169 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0620187002238152, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001908345830156357 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0644931653305227, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001637056221909264 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.051285956226699604, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012327125521204533 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1623855639995828, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002892414171534976 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.17796581661301386, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0025623361467453773 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14052920532911936, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018198320452371584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.20310628745671855, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0034230022998127862 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22379283876686262, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0030762140186834028 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17844826504839648, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022785596409348953 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.6829199554261502, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08848427999980182 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ccf9348ac1453aa05825921ef4be87bf02764a77 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.06596988964164227, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0026452643433214004 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07786694962495821, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002793778795842796 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.058680633472697495, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020527112852523396 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.018662630886825272, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011852493101770921 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.021659652341736273, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011776028400838929 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.015912520231271727, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008257625671288616 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.05090308576277237, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002121767282678217 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.05971715204113024, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002201135080103992 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04448068031172814, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015668077231183733 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.06266723632734954, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002537275263785622 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.07362961134314913, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026439669964067034 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.055493537558428035, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001944192579335498 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.4977010788321425, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.029197504340406147 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b822f8e80a74bfb6cbbe9e26d5dd4398ab8a6e70 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.009347302370204104, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0009939432842913038 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.012675375103590819, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0012741296212300682 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009019405424799239, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008796953070286968 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.002520125545331128, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00043890835709493897 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0034745962063106794, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004926837590871648 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002459973367560091, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0003520874137724776 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.007379431863883617, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0008249510021821957 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.009772980431375072, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009978936334822926 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006955043299953472, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006891726751168752 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.008880786469979814, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0009541098770127502 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.011981285756158963, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0012073677632838248 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008527269899079934, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008337482953004597 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 8.62147070684518e-08, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 2.4998412186774315e-07 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..94adc965e0ea1b438fe5879aa84ef05203ea45a1 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 2.5190605487649087, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14578061564278902 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.12015610790826121, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0026013907575401264 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.1007142822326354, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025699976738232087 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.08785204369989494, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001909841985405621 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.021978597704618782, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0011061787510217053 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.026856846878022297, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0012249926502431994 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.020631873410295806, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0008986868448192905 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.11432207717597319, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002375152014750786 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.09673002538661275, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024476967854968764 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.083870708743602, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017764834490443292 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.10920558363229785, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0023563322630614446 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.08646567425286227, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0022239273238183668 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.0771386142988915, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016644247241633418 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..81ecbc2a4da0abc85250ee93970a0c102cd3f5bb --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.471305506037798, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07875003513092577 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5170379371586666, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0033287522955400954 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4239211672299534, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002947218737469124 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.43708472576518986, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00224171007536442 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.24177763061210847, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026337382842525014 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1931046855790191, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020767023449716755 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19998119743920914, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019048339787913725 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3792838934227107, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002982844793468976 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3062355213393646, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023427585826778815 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.31725506977900303, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019449957706219145 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.42712804511272506, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003164747958067866 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3486090540172501, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002679539945997737 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3599294935860651, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021823306634720274 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6ce9aebc57ea9b6b9b9fa7c9b57355b0a8b89aa2 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.980968022690044, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.21821573679070036 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5445902709342957, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00337974740434529 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.458944313155064, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029017981497803163 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.47004796009089583, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022258968023120985 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2713453392654981, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002780199873202826 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2245350505416365, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022393722057462194 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23012493273504447, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002033859795223151 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4018381948627221, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030321901639654486 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33679603771757866, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002478135715528108 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34524196268248847, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020571216808165926 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.45423494017342136, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003233814196249404 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3829304393507027, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027623882797974796 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39203827558400783, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022732280818521912 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..36461f284d04059cf5c05c439f367c7488cc8c02 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.154980307761505, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1448658074579454 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5290233700279933, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003286733532241089 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4695155836113227, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028589858065198362 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4705643512917158, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00214940659696796 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.265538771393177, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026553555632510255 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23270443394551238, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022448787273333173 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23283631982568367, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019771157251113228 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.39229315419704086, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029631232557498915 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3458978765243631, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024472277771961978 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3471376353301056, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020102129845005895 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.44487893090959907, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003164337474810978 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39451585686809876, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002730627600611841 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3954525442177938, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022179179708118656 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1afdadcd76b1034d1eab4c964c1d61ec8f1d7d1c --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.721038666752582, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17683442815246456 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5089881039212353, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031941598167466606 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.479032657967036, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002765675705775823 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4691628743032071, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002144459294602491 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2551097554402564, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002576496565725004 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23713242535420967, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00222316717149407 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23219088772710936, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001982880603357365 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.37390882033029804, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028070940255931595 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3512215949214737, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024022657027433863 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3437342989792434, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019737589675455874 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4277340821604659, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003042188683426346 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40285522466618634, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026869688850980986 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39438992601573425, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022083897072610196 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5f9667fa6116f32968d876f1cb516dea54f31478 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.685692148533645, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.18475778017537345 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.508438587476658, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0030967236462497586 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4814718095446795, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002740769966051787 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4719066444266488, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021232213144874593 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2543070392775442, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025002270899075695 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2386513703857796, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022344362770068673 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2335596273503415, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019811310308482434 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3699950720656377, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0026651187832523664 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35074320852708746, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002429104142195895 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34320081095568616, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001977144393265691 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.427080652482253, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002971111279966823 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40443782365098674, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026631012930175323 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3963766746924401, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00219952367965179 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..015f8e96c08acfa0f7e04fbe03fa8e87b09d94f0 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1675664806545814, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002452603521749886 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.34303659164580813, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00451220621305511 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2155668468544653, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026646559073492822 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03864946281782141, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0014769194957715624 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08335808413265051, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002908314864654091 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05045080374949566, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0017576960885745984 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12702750275933555, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001968823066408308 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.26154017483908965, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003585895961808971 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1635478469839484, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0021077578920492917 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.13051144332858214, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0020713501923767027 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26981706823174656, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003957679243103724 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16836751227813998, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0022998758409405514 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.160170846637464, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09889873775096984 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a449c21d0eca0534a4fed54afa59a54735235ac9 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13520973640137626, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001930299351096568 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3323577264719374, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004491568598510519 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1898050764365515, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025895313777244354 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03140636068492149, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001113870373266841 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08109440867971819, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0029471809124174825 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04465858992847766, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015759770915751918 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10636283963297354, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014233454751993193 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.26423746064810627, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003579439421960654 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14968873061397606, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001933469116399493 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10653719114272985, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015634601753452939 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26451619174803076, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003902068769045215 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14993016736293346, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021358853384488446 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.8701953699144762, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.05457096063405516 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6dd419292c9eb74832c2d46dd8c7ea2e902584ed --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1369596940677527, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018924121735394107 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.33267847518896543, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004382896639279902 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1913140581117672, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025051242733995895 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03283865595587313, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0011141105617716379 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08404626501275646, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0029766014928721417 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.046514407795467595, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015752063358252097 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.11105944816976555, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014582290975397828 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.27226184993618935, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003638521351468343 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1555172607724421, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019665304832963766 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10559932998246374, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015493840715498106 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2597115453851503, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003887704936356228 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.148021529852108, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021093930620772303 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.8292996100546781, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08163094513619551 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a90f6f4cf8bc3dbde5997aa666cf466e7a8e8a4e --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13421303891622097, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0021412802231387967 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.310980261970668, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004684135200277263 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1828325966117306, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026884744365811403 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03176375904264973, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0011285744197009628 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0771291588842163, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0028009360577460445 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.043981143624385655, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015389553455476062 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.11010971775440595, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017060839433245796 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.257265478142769, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003940518987777604 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.15042887440453737, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002182144987791837 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10364375570761218, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0017533516458810485 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24201646695848927, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004005217279812412 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14143730410765654, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0022370123860963476 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.729714249041032, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09968587223572584 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e39ab1c60c58807ade253f5d07ca0140f49f38cb --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.04440086644350133, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0028076146832161425 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0803342918035357, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004572536216376621 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0521003876015691, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002910995728301919 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.011721386490746217, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001394908515617324 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.020621720002167342, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0017793611110912008 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.01307647569779615, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0011218803952754701 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03669834695042482, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0023530729136330853 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.06682107529885967, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0038307757001802474 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.04296796327738306, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002392166194141485 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.03617640134116618, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0023748208613590294 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.06502829732266231, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003786163884263381 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.042028608773829565, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0023859608992589927 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.9890184534659001, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.14163039170125274 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ff98b127f17fc4519699a7fc059ad65ff572a6f0 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/generation/slim.4b284b84bc4v2seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.003536517824005411, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0010348361693354221 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0026502867716370814, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0007219200372674768 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002975946933660433, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0008325096950346747 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0007216185282223018, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00028726019405366274 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00047841047841047846, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00018648358251820024 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0005678964868499288, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00022071683514847003 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0027483075773717747, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0008030756319798513 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0021047616766507017, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0005731278953348982 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.002335136000302258, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.000650477644840957 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0029063810983753734, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0008739925650642316 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0021888663476128875, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0006063079941836999 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0024473347701190456, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0006984333555662036 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3300633595706627e-37, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 2.704529748702706e-32 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_0.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_0.json new file mode 100644 index 0000000000000000000000000000000000000000..950b0d0a3c5c0a7e31a1aeb1e46d770fc3673ba5 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932575 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229857 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002512 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.48207528380800635, + "acc_stderr": 0.004986573992451681, + "acc_norm": 0.6312487552280422, + "acc_norm_stderr": 0.004814803098436799 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415252 + }, + "winogrande": { + "acc": 0.5832675611681136, + "acc_stderr": 0.013856250072796318 + }, + "storycloze_2016": { + "acc": 0.7252805986103688, + "acc_stderr": 0.010322309878339504 + }, + "boolq": { + "acc": 0.5804281345565749, + "acc_stderr": 0.008631175489166722 + }, + "arc_easy": { + "acc": 0.61489898989899, + "acc_stderr": 0.009985214798737247, + "acc_norm": 0.5349326599326599, + "acc_norm_stderr": 0.010234713052723684 + }, + "arc_challenge": { + "acc": 0.26791808873720135, + "acc_stderr": 0.012942030195136432, + "acc_norm": 0.2909556313993174, + "acc_norm_stderr": 0.013273077865907581 + }, + "sciq": { + "acc": 0.833, + "acc_stderr": 0.011800434324644586, + "acc_norm": 0.747, + "acc_norm_stderr": 0.01375427861358708 + }, + "piqa": { + "acc": 0.7616974972796517, + "acc_stderr": 0.009940334245876203, + "acc_norm": 0.7665941240478781, + "acc_norm_stderr": 0.009869247889520993 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_0_lm-eval_global_step80108_2023-02-22-18-53-17_0shots_backup.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_0_lm-eval_global_step80108_2023-02-22-18-53-17_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..950b0d0a3c5c0a7e31a1aeb1e46d770fc3673ba5 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_0_lm-eval_global_step80108_2023-02-22-18-53-17_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932575 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229857 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002512 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.48207528380800635, + "acc_stderr": 0.004986573992451681, + "acc_norm": 0.6312487552280422, + "acc_norm_stderr": 0.004814803098436799 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415252 + }, + "winogrande": { + "acc": 0.5832675611681136, + "acc_stderr": 0.013856250072796318 + }, + "storycloze_2016": { + "acc": 0.7252805986103688, + "acc_stderr": 0.010322309878339504 + }, + "boolq": { + "acc": 0.5804281345565749, + "acc_stderr": 0.008631175489166722 + }, + "arc_easy": { + "acc": 0.61489898989899, + "acc_stderr": 0.009985214798737247, + "acc_norm": 0.5349326599326599, + "acc_norm_stderr": 0.010234713052723684 + }, + "arc_challenge": { + "acc": 0.26791808873720135, + "acc_stderr": 0.012942030195136432, + "acc_norm": 0.2909556313993174, + "acc_norm_stderr": 0.013273077865907581 + }, + "sciq": { + "acc": 0.833, + "acc_stderr": 0.011800434324644586, + "acc_norm": 0.747, + "acc_norm_stderr": 0.01375427861358708 + }, + "piqa": { + "acc": 0.7616974972796517, + "acc_stderr": 0.009940334245876203, + "acc_norm": 0.7665941240478781, + "acc_norm_stderr": 0.009869247889520993 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_1.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_1.json new file mode 100644 index 0000000000000000000000000000000000000000..74d9db589a2a1dc742efbd3589ba51e1e8b6d38f --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.334, + "acc_stderr": 0.014922019523732963 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229868 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077247 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.0646095738380922, + "f1": 0.23179160021265285 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.48088030272854015, + "acc_stderr": 0.004986131919673967, + "acc_norm": 0.630053774148576, + "acc_norm_stderr": 0.004818031396138917 + }, + "rte": { + "acc": 0.5667870036101083, + "acc_stderr": 0.029826764082138277 + }, + "winogrande": { + "acc": 0.5951065509076559, + "acc_stderr": 0.013795927003124939 + }, + "storycloze_2016": { + "acc": 0.7204703367183325, + "acc_stderr": 0.01037770209970486 + }, + "boolq": { + "acc": 0.599388379204893, + "acc_stderr": 0.008570545612096374 + }, + "arc_easy": { + "acc": 0.6212121212121212, + "acc_stderr": 0.009953737656542035, + "acc_norm": 0.5833333333333334, + "acc_norm_stderr": 0.010116282977781254 + }, + "arc_challenge": { + "acc": 0.29266211604095566, + "acc_stderr": 0.013295916103619411, + "acc_norm": 0.3225255972696246, + "acc_norm_stderr": 0.01365998089427737 + }, + "sciq": { + "acc": 0.887, + "acc_stderr": 0.010016552866696848, + "acc_norm": 0.876, + "acc_norm_stderr": 0.01042749887234396 + }, + "piqa": { + "acc": 0.7529923830250272, + "acc_stderr": 0.01006226814077262, + "acc_norm": 0.7627856365614799, + "acc_norm_stderr": 0.009924694933586374 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_1_lm-eval_global_step80108_2023-02-22-18-53-17_1shots_backup.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_1_lm-eval_global_step80108_2023-02-22-18-53-17_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..74d9db589a2a1dc742efbd3589ba51e1e8b6d38f --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_1_lm-eval_global_step80108_2023-02-22-18-53-17_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.334, + "acc_stderr": 0.014922019523732963 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229868 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077247 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.0646095738380922, + "f1": 0.23179160021265285 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.48088030272854015, + "acc_stderr": 0.004986131919673967, + "acc_norm": 0.630053774148576, + "acc_norm_stderr": 0.004818031396138917 + }, + "rte": { + "acc": 0.5667870036101083, + "acc_stderr": 0.029826764082138277 + }, + "winogrande": { + "acc": 0.5951065509076559, + "acc_stderr": 0.013795927003124939 + }, + "storycloze_2016": { + "acc": 0.7204703367183325, + "acc_stderr": 0.01037770209970486 + }, + "boolq": { + "acc": 0.599388379204893, + "acc_stderr": 0.008570545612096374 + }, + "arc_easy": { + "acc": 0.6212121212121212, + "acc_stderr": 0.009953737656542035, + "acc_norm": 0.5833333333333334, + "acc_norm_stderr": 0.010116282977781254 + }, + "arc_challenge": { + "acc": 0.29266211604095566, + "acc_stderr": 0.013295916103619411, + "acc_norm": 0.3225255972696246, + "acc_norm_stderr": 0.01365998089427737 + }, + "sciq": { + "acc": 0.887, + "acc_stderr": 0.010016552866696848, + "acc_norm": 0.876, + "acc_norm_stderr": 0.01042749887234396 + }, + "piqa": { + "acc": 0.7529923830250272, + "acc_stderr": 0.01006226814077262, + "acc_norm": 0.7627856365614799, + "acc_norm_stderr": 0.009924694933586374 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_2.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d360b8ff3ed404cd5ab315dffa40652568ddfe03 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r2": { + "acc": 0.334, + "acc_stderr": 0.014922019523732954 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934727 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.258008658008658 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.4801832304321848, + "acc_stderr": 0.0049858608534276315, + "acc_norm": 0.6342362079267079, + "acc_norm_stderr": 0.004806593424942264 + }, + "rte": { + "acc": 0.5703971119133574, + "acc_stderr": 0.02979666882912467 + }, + "winogrande": { + "acc": 0.6029992107340174, + "acc_stderr": 0.013751092519806702 + }, + "storycloze_2016": { + "acc": 0.72367717797969, + "acc_stderr": 0.010340939873166822 + }, + "boolq": { + "acc": 0.6048929663608563, + "acc_stderr": 0.0085504542482809 + }, + "arc_easy": { + "acc": 0.6224747474747475, + "acc_stderr": 0.009947227833469432, + "acc_norm": 0.6047979797979798, + "acc_norm_stderr": 0.010031894052790978 + }, + "arc_challenge": { + "acc": 0.2935153583617747, + "acc_stderr": 0.01330725044494113, + "acc_norm": 0.32764505119453924, + "acc_norm_stderr": 0.013715847940719346 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745908, + "acc_norm": 0.897, + "acc_norm_stderr": 0.009616833339695798 + }, + "piqa": { + "acc": 0.7546245919477693, + "acc_stderr": 0.010039831320422401, + "acc_norm": 0.7622415669205659, + "acc_norm_stderr": 0.009932525779525492 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_2_lm-eval_global_step80108_2023-02-22-18-53-17_2shots_backup.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_2_lm-eval_global_step80108_2023-02-22-18-53-17_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..d360b8ff3ed404cd5ab315dffa40652568ddfe03 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_2_lm-eval_global_step80108_2023-02-22-18-53-17_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r2": { + "acc": 0.334, + "acc_stderr": 0.014922019523732954 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934727 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.258008658008658 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.4801832304321848, + "acc_stderr": 0.0049858608534276315, + "acc_norm": 0.6342362079267079, + "acc_norm_stderr": 0.004806593424942264 + }, + "rte": { + "acc": 0.5703971119133574, + "acc_stderr": 0.02979666882912467 + }, + "winogrande": { + "acc": 0.6029992107340174, + "acc_stderr": 0.013751092519806702 + }, + "storycloze_2016": { + "acc": 0.72367717797969, + "acc_stderr": 0.010340939873166822 + }, + "boolq": { + "acc": 0.6048929663608563, + "acc_stderr": 0.0085504542482809 + }, + "arc_easy": { + "acc": 0.6224747474747475, + "acc_stderr": 0.009947227833469432, + "acc_norm": 0.6047979797979798, + "acc_norm_stderr": 0.010031894052790978 + }, + "arc_challenge": { + "acc": 0.2935153583617747, + "acc_stderr": 0.01330725044494113, + "acc_norm": 0.32764505119453924, + "acc_norm_stderr": 0.013715847940719346 + }, + "sciq": { + "acc": 0.913, + "acc_stderr": 0.008916866630745908, + "acc_norm": 0.897, + "acc_norm_stderr": 0.009616833339695798 + }, + "piqa": { + "acc": 0.7546245919477693, + "acc_stderr": 0.010039831320422401, + "acc_norm": 0.7622415669205659, + "acc_norm_stderr": 0.009932525779525492 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_3.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_3.json new file mode 100644 index 0000000000000000000000000000000000000000..979c2816027792946efcf70312b1d8dc65be9fe4 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.319, + "acc_stderr": 0.014746404865473472 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402704 + }, + "anli_r3": { + "acc": 0.3566666666666667, + "acc_stderr": 0.013833742805050722 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.224400871459695 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.4819757020513842, + "acc_stderr": 0.004986538243846636, + "acc_norm": 0.6331408086038638, + "acc_norm_stderr": 0.004809626723626843 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.029855247390314945 + }, + "winogrande": { + "acc": 0.6045777426992897, + "acc_stderr": 0.013741678387545347 + }, + "storycloze_2016": { + "acc": 0.7279529663281668, + "acc_stderr": 0.010290888060871242 + }, + "boolq": { + "acc": 0.6162079510703364, + "acc_stderr": 0.008505584729104983 + }, + "arc_easy": { + "acc": 0.6292087542087542, + "acc_stderr": 0.009911292822056923, + "acc_norm": 0.6136363636363636, + "acc_norm_stderr": 0.009991296778159617 + }, + "arc_challenge": { + "acc": 0.2986348122866894, + "acc_stderr": 0.013374078615068756, + "acc_norm": 0.3225255972696246, + "acc_norm_stderr": 0.013659980894277376 + }, + "sciq": { + "acc": 0.911, + "acc_stderr": 0.009008893392651526, + "acc_norm": 0.894, + "acc_norm_stderr": 0.00973955126578513 + }, + "piqa": { + "acc": 0.7557127312295974, + "acc_stderr": 0.010024765172284242, + "acc_norm": 0.7682263329706203, + "acc_norm_stderr": 0.009845143772794046 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_3_lm-eval_global_step80108_2023-02-22-18-53-17_3shots_backup.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_3_lm-eval_global_step80108_2023-02-22-18-53-17_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..979c2816027792946efcf70312b1d8dc65be9fe4 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_3_lm-eval_global_step80108_2023-02-22-18-53-17_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.319, + "acc_stderr": 0.014746404865473472 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402704 + }, + "anli_r3": { + "acc": 0.3566666666666667, + "acc_stderr": 0.013833742805050722 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.224400871459695 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.4819757020513842, + "acc_stderr": 0.004986538243846636, + "acc_norm": 0.6331408086038638, + "acc_norm_stderr": 0.004809626723626843 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.029855247390314945 + }, + "winogrande": { + "acc": 0.6045777426992897, + "acc_stderr": 0.013741678387545347 + }, + "storycloze_2016": { + "acc": 0.7279529663281668, + "acc_stderr": 0.010290888060871242 + }, + "boolq": { + "acc": 0.6162079510703364, + "acc_stderr": 0.008505584729104983 + }, + "arc_easy": { + "acc": 0.6292087542087542, + "acc_stderr": 0.009911292822056923, + "acc_norm": 0.6136363636363636, + "acc_norm_stderr": 0.009991296778159617 + }, + "arc_challenge": { + "acc": 0.2986348122866894, + "acc_stderr": 0.013374078615068756, + "acc_norm": 0.3225255972696246, + "acc_norm_stderr": 0.013659980894277376 + }, + "sciq": { + "acc": 0.911, + "acc_stderr": 0.009008893392651526, + "acc_norm": 0.894, + "acc_norm_stderr": 0.00973955126578513 + }, + "piqa": { + "acc": 0.7557127312295974, + "acc_stderr": 0.010024765172284242, + "acc_norm": 0.7682263329706203, + "acc_norm_stderr": 0.009845143772794046 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_4.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b2fd5c0961d0ed108c95085b66899c7342303c77 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.32, + "acc_stderr": 0.014758652303574888 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.0149981313484027 + }, + "anli_r3": { + "acc": 0.3308333333333333, + "acc_stderr": 0.013588208070708992 + }, + "cb": { + "acc": 0.3392857142857143, + "acc_stderr": 0.06384226561930825, + "f1": 0.18571428571428572 + }, + "copa": { + "acc": 0.84, + "acc_stderr": 0.0368452949177471 + }, + "hellaswag": { + "acc": 0.4788886675960964, + "acc_stderr": 0.004985331652408344, + "acc_norm": 0.6372236606253734, + "acc_norm_stderr": 0.0047981844631563575 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.6227308602999211, + "acc_stderr": 0.013622567928799501 + }, + "storycloze_2016": { + "acc": 0.7300908605024051, + "acc_stderr": 0.010265413503221462 + }, + "boolq": { + "acc": 0.6226299694189602, + "acc_stderr": 0.008477957863309996 + }, + "arc_easy": { + "acc": 0.640993265993266, + "acc_stderr": 0.009843424713072176, + "acc_norm": 0.6233164983164983, + "acc_norm_stderr": 0.009942848077476165 + }, + "arc_challenge": { + "acc": 0.3054607508532423, + "acc_stderr": 0.013460080478002496, + "acc_norm": 0.33447098976109213, + "acc_norm_stderr": 0.013787460322441375 + }, + "sciq": { + "acc": 0.915, + "acc_stderr": 0.00882342636694232, + "acc_norm": 0.906, + "acc_norm_stderr": 0.009233052000787736 + }, + "piqa": { + "acc": 0.7546245919477693, + "acc_stderr": 0.010039831320422398, + "acc_norm": 0.7709466811751904, + "acc_norm_stderr": 0.009804509865175505 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_4_lm-eval_global_step80108_2023-02-22-18-53-17_4shots_backup.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_4_lm-eval_global_step80108_2023-02-22-18-53-17_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..b2fd5c0961d0ed108c95085b66899c7342303c77 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_4_lm-eval_global_step80108_2023-02-22-18-53-17_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.32, + "acc_stderr": 0.014758652303574888 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.0149981313484027 + }, + "anli_r3": { + "acc": 0.3308333333333333, + "acc_stderr": 0.013588208070708992 + }, + "cb": { + "acc": 0.3392857142857143, + "acc_stderr": 0.06384226561930825, + "f1": 0.18571428571428572 + }, + "copa": { + "acc": 0.84, + "acc_stderr": 0.0368452949177471 + }, + "hellaswag": { + "acc": 0.4788886675960964, + "acc_stderr": 0.004985331652408344, + "acc_norm": 0.6372236606253734, + "acc_norm_stderr": 0.0047981844631563575 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.6227308602999211, + "acc_stderr": 0.013622567928799501 + }, + "storycloze_2016": { + "acc": 0.7300908605024051, + "acc_stderr": 0.010265413503221462 + }, + "boolq": { + "acc": 0.6226299694189602, + "acc_stderr": 0.008477957863309996 + }, + "arc_easy": { + "acc": 0.640993265993266, + "acc_stderr": 0.009843424713072176, + "acc_norm": 0.6233164983164983, + "acc_norm_stderr": 0.009942848077476165 + }, + "arc_challenge": { + "acc": 0.3054607508532423, + "acc_stderr": 0.013460080478002496, + "acc_norm": 0.33447098976109213, + "acc_norm_stderr": 0.013787460322441375 + }, + "sciq": { + "acc": 0.915, + "acc_stderr": 0.00882342636694232, + "acc_norm": 0.906, + "acc_norm_stderr": 0.009233052000787736 + }, + "piqa": { + "acc": 0.7546245919477693, + "acc_stderr": 0.010039831320422398, + "acc_norm": 0.7709466811751904, + "acc_norm_stderr": 0.009804509865175505 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_5.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_5.json new file mode 100644 index 0000000000000000000000000000000000000000..dcef3076cb7d921944330ebdc2457b0e479bd084 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363935 + }, + "anli_r2": { + "acc": 0.347, + "acc_stderr": 0.015060472031706617 + }, + "anli_r3": { + "acc": 0.3325, + "acc_stderr": 0.01360541734571053 + }, + "cb": { + "acc": 0.32142857142857145, + "acc_stderr": 0.06297362289056341, + "f1": 0.1621621621621622 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.48008364867556264, + "acc_stderr": 0.0049858213361464, + "acc_norm": 0.6368253335988847, + "acc_norm_stderr": 0.00479931720990201 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.029882123363118716 + }, + "winogrande": { + "acc": 0.6179952644041041, + "acc_stderr": 0.013655578215970424 + }, + "storycloze_2016": { + "acc": 0.7279529663281668, + "acc_stderr": 0.010290888060871242 + }, + "boolq": { + "acc": 0.6214067278287462, + "acc_stderr": 0.00848334171802448 + }, + "arc_easy": { + "acc": 0.6477272727272727, + "acc_stderr": 0.009801753933112778, + "acc_norm": 0.6199494949494949, + "acc_norm_stderr": 0.009960175831493124 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.01340674176784762, + "acc_norm": 0.32337883959044367, + "acc_norm_stderr": 0.013669421630012123 + }, + "sciq": { + "acc": 0.918, + "acc_stderr": 0.008680515615523722, + "acc_norm": 0.914, + "acc_norm_stderr": 0.008870325962594766 + }, + "piqa": { + "acc": 0.7524483133841132, + "acc_stderr": 0.01006970396685711, + "acc_norm": 0.7747551686615887, + "acc_norm_stderr": 0.009746643471032136 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_5_lm-eval_global_step80108_2023-02-22-18-53-17_5shots_backup.json b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_5_lm-eval_global_step80108_2023-02-22-18-53-17_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..dcef3076cb7d921944330ebdc2457b0e479bd084 --- /dev/null +++ b/4b284b84bc4v2seed2/evaluation/rankeval/4b284b84bc4v2seed2_5_lm-eval_global_step80108_2023-02-22-18-53-17_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363935 + }, + "anli_r2": { + "acc": 0.347, + "acc_stderr": 0.015060472031706617 + }, + "anli_r3": { + "acc": 0.3325, + "acc_stderr": 0.01360541734571053 + }, + "cb": { + "acc": 0.32142857142857145, + "acc_stderr": 0.06297362289056341, + "f1": 0.1621621621621622 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.48008364867556264, + "acc_stderr": 0.0049858213361464, + "acc_norm": 0.6368253335988847, + "acc_norm_stderr": 0.00479931720990201 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.029882123363118716 + }, + "winogrande": { + "acc": 0.6179952644041041, + "acc_stderr": 0.013655578215970424 + }, + "storycloze_2016": { + "acc": 0.7279529663281668, + "acc_stderr": 0.010290888060871242 + }, + "boolq": { + "acc": 0.6214067278287462, + "acc_stderr": 0.00848334171802448 + }, + "arc_easy": { + "acc": 0.6477272727272727, + "acc_stderr": 0.009801753933112778, + "acc_norm": 0.6199494949494949, + "acc_norm_stderr": 0.009960175831493124 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.01340674176784762, + "acc_norm": 0.32337883959044367, + "acc_norm_stderr": 0.013669421630012123 + }, + "sciq": { + "acc": 0.918, + "acc_stderr": 0.008680515615523722, + "acc_norm": 0.914, + "acc_norm_stderr": 0.008870325962594766 + }, + "piqa": { + "acc": 0.7524483133841132, + "acc_stderr": 0.01006970396685711, + "acc_norm": 0.7747551686615887, + "acc_norm_stderr": 0.009746643471032136 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..560652725f379771ece058bc34b1ed664bed5123 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3369320d50b68a7375b32663eae2167c13ddd58f917ebcdcc2502fcfab7f15a0 +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc22b53504b58114d817b96225b4435b1e9be039 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:895bb01634be6e2b4e90b0dba95828813a3064de292887794dd0542ff2e2dc8d +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f98fda42972cb3d0e134541a64a83d76ec8750f7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e4d34d5201bc8b77cfe4d6b8d1bfa40a0272db66ce61d8d5f434ff4d05fa05 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca3ede8f11d7174691422db51172b9e47a029008 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e4d69933fb033cf784427b7e687bbea97c89cd91d227b8d0379a72ca586b17b +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d41fd106e737471199d933d6bc902b762e35072 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e045e372ca847ff1e22f8ba76ed20d98714519a7b0d8e348ae2c1377c287c7e +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46950e71f29254a3e1f287fd26bc96c75d4a8a03 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f0e02ec80cd094124c5636c2f960a1c552fab5b72a67cea727a8a6b64c5dcae +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..324da18ae350967bf81116f6596ed8afc8ccf20f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c32f7f191e7f5bb63448d17e59168a0b8302f6bdaed906d0737b549ea2debc47 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97f18f81640a96a35c4d51aea87874c864b7747f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f28f6f67a88ba4c538f097750e915d71a1c560acbd39d77436a1eba7c0e130 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67ccf060d09d977a61bce19e8962755b1ec94aee --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:008e867944a58fbcc935856907fa5792e8b4f88714433e736b8c493c947b9790 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a55bae5615195163301fb1fa150f77cca1aec492 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b110f2121398cdcc0ec6602dc07fc22e61ad424693f69f82fae30097ce6e8eba +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27addeaaeb9df926bf8752f39b51802bcfe758c2 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc12511cc931d2053e164c202ab41b7ac155e5e80fdbb9dc224282f16e5d453a +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8c42d4bcec4a38cde5811499fb7c564b5b21a6 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21da9730d83fabd11e56d063e75e3767a0920404fe1b5c030044977424e4fbe +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5508adddc3cca2659bfab610683facca803c2d4a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9430bfae3d58a4643f94e17fb576bbb9ad2c0464368046e4121e350ad370cdd8 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29bc5e57140a632d9a4f636f22705933fc570dc6 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a71ac1e68ba9e29d7f07c00119dc426305324300a168a66c66ebdef76aebde +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e3a91a447d62141e873e6f222d81e5b3d9f67d6 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f8afa4242ed57e16b13a0077f1049f2441f8c09105fe0b7d6a2d58a7f6cfb1 +size 199058669 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..baba796c2b242a5d8ee959163458d3f616232375 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5771feea7bea428b7b0946d3d5e148bf0a76c4d5abc79b9cd963bcc14a41346a +size 199058669 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7a698d7996fb8d138389bb2aac9189db7dde81f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0926c40a0b41cc84629e83c77ddd20ae4df3729cbbadd895d72495a6841fff01 +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca3518cfcecde193a5851cdccbe6cfc1beae157a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09897658f2e93306db770441cb7490ecf28ad45f4e8dc66344b6a3e401db1e39 +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a93d738e691d6749153036a548d5b30ff52e3c93 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4103954465dfdcec18bf98aace81233df94334478196c46abc264933dc2ca836 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..920071d33d50d1163e03fe9d60a619d47064f1b2 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2c988da4d40345b1fc4027fa6156642680d2e65c7c25b8a621353c2b5478d4a +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7448b099cba7c08937a30c1586572daba316583 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1793876d76b724426bcf2c57ea303209bb594747eb7399be5a4c15353c0fd04e +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b02fdb27f859a7cdf87b4a84e3837dd2111515e --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ae0256587f471ce725804be0c4eb665441a146e8b22bada21c3086e1737821 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0477ef4c13f4a393ae8bc88de44bcd65cf9a06a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:793ad317b296e98d46df17feac3d171240102381e39732169073196c9e1cfe30 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24c23463d85eddf85756c6b711ed82c2229ee205 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c7b3767071622c15abfae1ee7399ca2097fcd2e8dd0fcd0f305e475e213640 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41a437e35d6bae72f44e93dad3eda5d812f0d8d4 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55aa7cc7503e7ffc00128f7f0f29440a64b385aabf44691c203c13b37d546af8 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f178d8a35f051a74f769ac207a2a78dfd89ec00 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f119fafd804d44da5f9f96832d5cb2b388afa371ebd372b5493d692723fc6c1 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbd331a9a757bb68993ef200b39eac97f2156cde --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c2a7f9b8cfe98ef241f64f424c242c44e7e2b4c39c60e6b53d0e656fb24690 +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9418a808e6007f7330072cf14b6d73d67cefbd30 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30fc5fc0c4e144234f4117ebdda40a6c27e104820689bab12a44ab0d3d94672b +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a3a2e2eb6fa02f1945fd2f07083533e34330e91 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0e57e76affd779d820a80fb1925c42278b7eb173965c47245cec29f5378431e +size 199058605 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ca5cfb532484cd6a2174386a64a96ec61f63cbe --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b649dc355697c5e360dacc4384eca6ffb6108d6d3049fa42490c9a6bb759b18e +size 199058605 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd5de4a60b87eebeae45666319bffef388b3f84b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9449f8b31383df60546d42db9edefe0c110bd0dc23dd2a63a2db1a803a96775e +size 199058669 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39f5c85bf3acf3cc615ea0ef7d43cfd0d795b136 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d52af8e5f15b22b5047f2ad5209af78b12c0587160279e72eb5f56135c27ed +size 199058669 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..299174bcfaa71828a4f79f15f4acdce5b8b341e9 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8858e890132979be00f78bd88a824688c991215780703519b381f47ae1c7f787 +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01eec17ab88ba089be729d1ad06f3bc9e106b898 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a306f3172083f78463f2c2802707cbcaff463518e783ff837a36a7fca3d5ce47 +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d4b857ad5a273d15cf7b09a5ee749302eb8d787 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402fb9475ed0365388ae00ea6021d88a7e80e65cd0de4e5f0d1c318272195e0c +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bda671a935f24fed26aef9c119e227fc36f307d4 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdefc61e07e0ed29110e7b5bfae07ec39df2db6a889ad0812a3faea5dbcfce99 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6fb4b595741ff40b299c9169bcfe0ec61cc874d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e34ba9aa8e7f27494f4b476b6b2512bc3107cf47f90c113f318ecfe38a6a3d4 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..036d060bd345e69223ad9e44557ec5ee2744d231 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6e7d109041616b66e1aa754f1226a91c53437d569492b472732317de3a10471 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b979151306d75df53f016b3a5c4f8b4330812b80 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:470ac862bbb15685a7859f098969810f7e5ecd90d6b71e3da470972c078139e0 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ca1060db9f7f97cbee4394d9a027669c3b4a9b9 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f12d8a4e0be416a794612de6734508cfb1be9bdd4aab9642d8ec0fc1a33964 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ca39b16ca17daa100701cda083bcdea8dc6884f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51462643ff5b5a5e80f0e411fd78f152fbb697dc8a95f37fa8a1c20817e18c82 +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f48f30f360b25415df39f7c50b52575b2a0ee3 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e847bf72e833e5d67f5ca578a2a6d0765ffc65b506ef6f0b6037f2300c32deaa +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1722635e5fdabe4cf478ccd4e89a1c78431a155b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ed125f8ecb9b0d569d1c4f9dd5553bfd35ec555c88e6e7a2d76cc4160c6a71 +size 199058669 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69089842f30b86cb6273f21394bb8ef64dd3f283 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04c6b20cd4aeb0e48317ed0bd14983bc716458e26d5476ba1c44741e7c501f61 +size 199058669 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8301a0b6afccc623edf01de3f0a2a06aac56374 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5017a4fae257fea075f7d8589d98a71c5a217a2f6fc3b05db06831a01be32e05 +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..960863d154835d54caa349949048d1328dab7b47 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:374ce506e4c90913ba0f1d2c7a3098670a83e40d0774a9863237e6d3f73bd6d1 +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e3a6b396e9e74ccad6aacb095fca7c9e03d5732 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c15c806dec31e87e9fa230f873f2b5b51fd954bca98b368f64a94637cd02eba5 +size 199058669 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90d2839f7a9e1a56a78043a929256e07fc249959 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2f8cef23133c32611b32f67cc570a443a6d71b121874bbd132af769595785aa +size 199058669 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e831673f1c0025c2e191c7bcfcf1da6355971222 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d602aaa31dec6834cb1b39208b78fd5c3ad8cdebfb75a01b4e0d7b2d810ca835 +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..930c8998c4b61ab364a9c5745ba200aeb11131e5 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abb3df4f7f2a9ca3e5116ad82e940411e4d7b91a41e499f17b9089f3cd801d15 +size 199058797 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81fc563567cfda070d7ca1b31878d732a3811ce8 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00efbc04047c7af1e39d7469f5411239d8aab2f3ab6d1d6aa1a7a79d10d81ba2 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..452a466b215ef70cba1a97a820698a812b64648c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0035294e586ffb85deaed0dfc53a0e35de44ce63f80862a4f0f3971d37206872 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa8bf8a9064c2d47a8ae21c58be33717c9dd0c59 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4afd448021a30a32229a556cbe1eb42f7576d1ed879dfd13c6793a880b4b05 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..527cc984c933316dc9f826880cb60e239941e46a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf71891e9c1da497af6cdbce14c32267fa771dc2f1e738df46403ae14333ea1 +size 199058733 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7d7af0c58485ffda63131ce0884aacca4d56f0a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd0c8ae34194bfab300d5a3f886b3eb97940634af5950ec8437f5de756c939c +size 199058669 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbba6d2d0cd78f1738ebdd8253655de7ed5d1e94 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41927eb87ce401ad1cb5fe474ef6ed599f32547e3977e40b7ef9d2d130cb1989 +size 199058669 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f44b453f3e914a86e396bc4e01e0f800cd3b7fe6 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d606f20581b0d81bead7447f260152b8e5f9e8d101da654071c82ad14ea9fcfb +size 199058925 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaa34a911ff2ddfc814bb46508a7843dc9aaa1e3 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4596d36b75c0fb15da7e00fc2927d20dcb2b039a0c75e0a98645783a563d8832 +size 199058925 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca61f5ddb093131207a201225b02db9555c1c3e3 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c60059bdd85cabe200ce19583847145c428448b725c50a3916ab6726737310 +size 199058605 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b15dbac4331e985254e50ba9bf75f4adac0fda --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22ec13a460b4caa1238670b59458317a29060398e94622c5b361ca2d68642a9f +size 199058605 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..943828a3fa09785861c81117759117c4f3f7f4fa --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9670d8ae64ff95384a70d4e1302b7620e5f400537bd64d845d801f783be0d9d +size 199058605 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec2f30f0cf4fad1e6938ea5f5e46881f0df0bfad --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d748bbbf188966b10964798a681f0034554dc89b4056359d0dbebcf52f866c +size 199058605 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db7165e18c485d928ff3aab3c978e457dd8cbb6c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f52414bb5da125df6800251fa7201adc0fa4c97acb6572b7008947028fef1e +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ca6c4b269b44668856d407ff35cdf3704328f63 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e10f35afa686c2547c49f210021287ad86140437973dce6ab6241f24f8b38b74 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f7a48d9fb67ccaf93208dede84f769e50ee7dc9 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:249d1b8a94aadf5febbbc68b44a9aedf67cdc56f6755426a99f93168eba8bc7c +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a44a49c1c299f61f9b1dd25f0cbc75ed0e913d74 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:093d73a909f75baa3409ad8079fc788326955e577f8c0a54422ea6e05fe750bb +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b8499aaebab324c78c2bcb4a004785f5cb720b4 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bd5459253be363485880a7673a0a93f9286e68b21c232e0e136ce90b1adb399 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b813238f8be7edff31793ea7a650cf84fd20650 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc9ab32fdec6777e15660961406471418896b4c6d44bdb1f217cc7227f6389b0 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8652a28c78dd6a5a3c0f9b2ee296b27e2c80ee16 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c65b31aea42590cc17019cce2777df529c029f65ef56778370c4d95f9871d2b +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a48b4fb1a9b71b8fc6157f97f70c2747c388538 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa6b4aece704d7d84d58f746c7ec1fe33b247471ca4eb7ca239e902bc243347 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bdde1e68e0ab3fc268aaf659e44f8bc4938aad2 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6096d4721fbd37622d5afd6fbf8dc0d81a1cab2dc807fc0336a69078784b90a5 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbaaadc518d8b36bd56e44d2948f2283d12d2e95 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:382ff93c50e558c75289fe2287a071449a69b2146bbc441f33944fe8380dc9b5 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fd506ac5021c51e96c680c719f61ca6380b2fdb --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b83dd0c74ff338519de3bd72d5a8b51073b5a9f87267702b175786f115b53bcd +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..560da19cc9cc4db8a6b1257f73bb5493d84dd1a8 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2217d36f3b687912c1a725b353a6f0f0161c91352c4c4e31c1bf28a5d72a15d +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..433e980819ca56e9380fb43bac40b6d0e4df4d9c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620712dd9535ddea6481edb8b2ad00654224ca9a813523b0425b2ac629e167ed +size 199058978 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1a3862a706b6b8486f83e388fc0690aa062559a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8591292914d238d569c59a54e0f682246a73f7970437c96842046d26b47bbc09 +size 199058978 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a97c6eda663a424375bc40ea8acf009bf4a606f5 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a744e21764ba99f855f6f8de04d62226582e37568e76101d8900b9dff95af864 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9c5d06c91827d2968dd4d57b63319b30c9526f0 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:757d2268fa479890bef0d6426d4e3e1e3846106f39d3459d74db6596d341de63 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..707ebf4c3143f02ce8ef6c581eaaebf9b91775eb --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2fabdcb458935e31fff97626c91f1c60ad23b5e9db40b60f6214da102011ab2 +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..456768848ce33702930c6c57d932a399b84a90d0 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bf3c621449a696661a9ee7cc27340627df14601a25da0ad2a8026c01db687a3 +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbb283a832ae92469b2a0751024a62ea10fbb8d4 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9fcc59d45da305cf7d63f975c448cb496c73f258d4437a1328d95e8725b7551 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..290e2eaeaa61c040d542a371374a2b1ec5f78557 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a91ddc489b3d930405c0fa92f92a22ddbf07ba5bb94497cb9bd76d7c8401897b +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b16f61ad73f79d255f718911225c2a1ed989ead5 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d2decde0229fa1750223789b85e15b243ee6238197415fd421f2f1c11fd1965 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..054eca7fc319bed4840f2bc41d4dd9b0976e614b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2849e5820f76d664e058a10e3a4941888f5c7221a959e8846215cd0e80116a46 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41c1c5dfb3ea7bf21907faed101d902464309bce --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2fd8cb97817313d7910575e065c1978c68e99da15389216ae3812b76d3e803f +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19a01654e12b0ec14cf0863a9b8247997bc9f7fe --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fc24201eb4a3aa790fbfcc647259ebcf276c3711e861dab1895e1d9216dafd4 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a76cdebb8815ae8b1d2ece1d69ee8db7ac18d3f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc3bb784add11e45c05f2e3b1a5da74f03b1845b59495401c1460a8aa9e62899 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..105534bbf99a1893de8d0c8968d02c038296efc6 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5edeb5f52d81bd50358e8f380a985a34e71e39d2c837789849212e4bac279ebe +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..280f2fa8e90e3e0545196661d49ecc8df7629d08 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b224a9c0a99db34a645b9cb19daa4e0f21581ca9639b88c5fe972f391a3a1c08 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c9bfd3a2eea7c1fd019e50092fda7388cb06f20 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49a96d2e4dbc0af68b9cba8b9b84a2e7d73ddc24d46bb06d5b689fd7fca1115b +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9515eb696b0c6f21a68217b430fb092a250f19d5 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7a39b65c720a538312e790b59284bd84dfc0d2e5a5e553ec5734749f3e5b84 +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0402d57030fe5bde97b845b5e26b6f5ddac1653c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d4d7b8ab660d18599ec6284bd81e3ee37015ab777b0924786dc25d3876bcfcd +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a5b36b00b2e34fe83f1c1e1a6dd052b5ab770a4 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33be39d2a4092d74d2a16e7bf2f130d1cbc9761e79b20b74c31d87d165b67713 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..164f56c1c61ea264a9ac27552f09b6a7cd16ef33 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd33126f58262ee2af61882fbd2ec90284be7ae06cbd5702e1df97606231032d +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5abe0f12ae5675765ff39b7130eab367d74026c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84adeb3dd5833e6b95b227a3c7ffe3a9cf77d5dd947ae7cf17e8155abc1793df +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eee11b12ae011553bbe3adaa97d0ea069c5c05a0 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7bb2c750a626cba7560b7fd45042ec356e3c4f0223837f4ea014df450bdfabe +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d816f0de10fd10aa5bdc26a75c65bddf22e9c15d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8e39e60b22ca15e35458c1fc5ec882d55e7b84d0646d570e3db5879395e4c15 +size 199058594 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e9a036410881fa41db2112f6ddf68b5709e55fa --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbc39220a2bce74ff9003f81fb629f1c8591f66e08af30eb66831970012df611 +size 199058594 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..682b794764ee1bd2360ecc98b6c51628ae22901d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfd6ea2eace1d398fa8bd725e3cf0567e4eb1d17fe48ae266d85a6ab31daccdd +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e2798a0cd3a699bbb32c1a0126cace83acebf76 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc1277877a78ca9cad95a65609c6765d0a6bbe3fb5c756bdd3209bf941b0a8d1 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..366c6811527d6fde6d589b7692552e0e371f7e19 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29699e75e5e77b37f8c7e93c142df2b18f13ec864e419d2aa5d8f9fd8b4524db +size 199058711 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f775b49ddeff7eb96d858dc1cf37b9aacaf2468e --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3931a5f246db39ddd742443b692f106127eaaad522fe29f60089fb6be5bfbd6 +size 199058711 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d1a95401c87bd26ac48ba958ab8e29d655dde47 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:018860309ddb11954828af2349e57c24eeb67ee9d9d9c2ff9b43f62b47b44697 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68f2fb2b094e493e06554bc040f1fd193a8bc3e2 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b77c0c43867c4da27e0bc83e44b939068ea7b295e09f48e571ebf978edf3f59 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b87275f8b9dc842c2e2f8eff1f667b74e24cb72 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92fec803c2e39b7c227667826e3b43d23ee0f400321e504f7aedc10d9876d832 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81b804cc594103e13dde7fa27021f91f80d1c585 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:115c43a7f11ae2bb76eb9b4f57ca1091cfb7133649d647f761277d7d006d03a0 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..110969e3b2c02dcf0267de270b751f683da6d168 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:553ea80f43136389993c360400d51c780fcca352710266ef4761d6ed1391eb55 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ade02914f0346e9ad4b9fd09e5d61b841b2d8470 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c701476800ddc29b48cafd750316d865bc2467d2f860b2d6cceb6c8248d4cfec +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77fd46c6d0fb65f74dc8fa41fc5fd7b8df74afb7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca190ff3a8ed54beadf01d3e1cd4dbf43e90c7af0c4dfb909f49df1f6f3102a3 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bba2b8e1d7e54d77a7c539c2f8999903dbc3f37c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2b3d0666956eeb7291a9ba4491d1f86f09c101e3d5b1cd995479900da619dca +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7775fec218b89029cba503d216bd11f772ac71de --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32aaeee5108e184d3615bd39bd94990d7f65500c8c955eeeb07c1f9d928fb362 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c81e00261a7fbc2fd518e89541265c0c98649e7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cf4563f353c0e987634361f2da353249a2b83adc46e87eccb76d626ee235835 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82270ccadbd9be8599e9660839cf1ce84cae42a8 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0bc5936a3ff4a6f871358f4742dee30f35f08852bd0bd4c8ead6938d5d93303 +size 199058594 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..184d9b60fb8ef67347d100d792f1c0ac181651bf --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc462e01296cd4462fde09aef9a12b71a394d147229da9e6c5bdd18b57b4c387 +size 199058594 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5974839ce7c9bd36a931dfcd206e8b9d81df7521 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e116871c7680a30f9248efe0a48b61bb70bbf1ac2f9bcc47deb307598f31fb6 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de435dc60f9264011bbed71e67d3ecfdaed3ff6c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e2d68eb96ff0b573ba4bf1244035a64b7fad444178d61aef1a87b440fbb1bcd +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa4e51c2ed9fceef389e5275245fee8b874988ed --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69f78395823bd6ac49c8724871328e5db7f21f9a2d510eaf15904a8796475c6e +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c81286782337d93e14e42890eb82e9214e7ee8dd --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3b1209abd0e37f6852a0b12f90cbbf01df29693809b9dd41da0cb33b29c42f7 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed73f3c067dc47999652d6bf47af344f55a077c8 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8410dbc5cc9dc46745f8407b666315d734007f61779effbb76e9873b88e242cb +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a21ad8afc35316b368a0015c735142bd87247cb --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3943d65991570cb2d79395c80d9e934d1bf0d3ab46ee4e265ee5730db7204523 +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80681f03fa291fdf95b80012c29e2135ae7fdc45 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eec828840c3417ff833fd7090e225d7d8d14dc6cf99167c57a91ab3de1a3a611 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e688b1413b8379b09c858ded91c73e41fd6bb532 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa7a64682ef80ae2efee2c0ccdf0449a42bc6bc13638a2a79dc36b1ae43fa701 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a234f8b02b96a3fcac5a9521c9952a69b32f69f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:038ca33402c2cf9665bcd5e3c00497b923e23d9bc58ebab71c296f2685be8fa8 +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f0e0d377817d41cf4d5294bec59bce6f4c0f383 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2a9da85abedeef9be5b13309410adec3b0ddd6da55d6c2861b28bb278abd9eb +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..913d822d9ad177b71690fd8a054f557ce856d2e0 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6fe5d68979f4cf38ae03382fa705bbee2b4903eb3c13089178610eb623020dd +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7983234045b64569a6353d34bad2d3f82f174d68 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f182e98c1d0a787af50f883da1e3cad54cfd463af1906e1d9e3609c38be31dc6 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e23d8fd1ccc51495499ad26dbcdc0d00c4e81fe --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c6abd706ae32315c7461df113d4c7cdbdbcf08a767e88f65124701fc42ee10 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a69639c917870439040bf94eccc54066a89f629 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a95a9ef1c9ce1c28fa08dabc8eb668b6bb896ab2a11b882430b119b3969b92f +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04b40c80e3dc6631f745a3e97203aea22bc729df --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58949846108fc4b132501b7bb2dbfa70a2f96106cd56b3ee7e42a70fa3b7c252 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a952c1b60e1dc9fd50f82d3c7d6ef6f54e89255f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd4cca28ed656debd8cb5f5252d940d5e73bca0f49bf7a6e0fede730c571c046 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9908a7a679cbda37a310ad3401a4003b14eb866c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c50ff5a63050309fdf41a5936d2df7d904a2884d077300b4bf08c4b5e5be4234 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af19d1fe3db781dae39e3e1fa6319c210552df53 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b76832dfc1b62769f162858f84ce54562e3de428fdf5fdecbc441b3d44d2ef +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ae1b20c210fbe4806a01cb5751151698577f926 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f07a60afe5f3523eb37e31716300aa6767db6ed8c0bc5b38975e0e44bee1aa1f +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..584a38ff34cc6dcc0bc2c3848bdebdc021d77850 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef622c5d6013d280f0613d465cfcd72a6a3ca56214833061bf3156caa1afebe +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a191329e44154e1757e4e74a0e357f7d8a95a9f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b17f7afce30c4555b9de9f6ee5b3c19489d39818f06a19508a34892af2654671 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37cc092bf3b026571cf60a4acca874f82ca27a8b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eef01a9b4dc3525eeaa800b02a488820dd81f04726cffe208f8b9e9cb015609 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a3ee0e757f36bd9f1a38d75696eb54dae267db7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf37b148ac2164122b18cc21d731d98ba98569b02ba76e96252a16b0d0ad6fc +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab8b739494afc55303a6d1280d5e7abbdbb0ab37 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6facb2aa04c1f01c82f25d195c551b44310deab2dcd5ed30107d399caf4b5dd +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d8915f445cbb1a15d668c7ef937aad9f1b8d7fe --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8447419d9947aa8812e7d3b7f08098b186e7b90ca741117536b186dca014414f +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d85845e3caea1d1edd4e59c57a8bc4f55b8688f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa91dc0daa1f02e120189435306c763e8065e6728f55a4d4ac48c9aca3656c3 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6190833295db3e10deecd2d79e55e019619575b6 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:374d0274a6b03090eee9855b6182fdf299c5e293688e7deffe089da0cd93fd6f +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a928531723dc9c994ee76efc67fe2216c88667c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:213ac557e75ff9335e1cd183f97318ab664d8af5e8e814d747f8d5384fd8f331 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32b15e3139b90516391ea01d59515d32740f89a1 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:966c2fd58df4ef2c3e94bc50d7db3778b415c3f6bf5e61c318f1f8edc95e6dbf +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..616df96ad66b624f5fd974c997d15798305b6baa --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:882fc7d8816c57d1fb52f30873b51b9e622112d0c9975e54bc1b12f9d956968d +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b817f88b30448e3b643f02415100f62aa0d59757 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:553586c0c5fdbc55c4e5c510b7a3551ffa15832ae42eaffb2c37d6e57f2e02cd +size 199058775 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..124ff7cebd79e77853d4f7e809035cfd683ffb73 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:573b9c29634ab99c956558a717d5293e470b565918e15380e8593f0268e10ed1 +size 199058775 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17fda3a4a3f8719f3eaa87a084aeeaa69faf2f88 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e722460bd239dd8b1eb9d7682d2cb2ea926bc2b86749a5a08f176b1a17023dd0 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73f98099475acec5d05c1a6c81fe14666a8df928 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcb2f1b3ba87fc0e6127b492fee068fbf8f055ccbcf869c3dafcce214bb40e62 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82d829e035461fa3834fe76855b8249462323bc2 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b3fdac50d50985f046e5d41ac123d9f99b757dab7bdcb0b63999c0f939ec807 +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6464345f68a658c5348fadec1264d3b85520447 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78eabd109945bd69406455b854273c7b9959305d5a15b4c98dff7462685e47ad +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6030f739ee9b28c248f6eb631451fc39c385baf --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e35eff073a859638a777d171b051efcd20d1c40e234b2f8f3368faeb476c3ad +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b078e712b77b01707e87d7a36ad73a2ae5e9698 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3704200861f5334c51be8bbe9a0d167e2a7e9e6ffee132a082a8ca3b8fe5881d +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..141f3cc744710e4d3d2d022c6386f82c8c211668 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:440b4eb1a730367ecbc7c5bc5ee51720a94d96054231c252d8ee5adacbaa3666 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5af5f31fd3192a71b4b678a6f749a30f389c1b4b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad643ba0a9548b469d62f1920fe056d76359b336f8197b288db5cb667dfe2ed9 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f670bbf6b90b433e00e0829d81630abb56b33f0 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5ec81099c1ff2b2d9cdad5f983f796a10b6e16c2d8f02b294b6b4618c7bcc1 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..040cbe011690bc8c835954eeb69d31e0ac781002 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1a16a6d616a486859168deac893d251d660c225a77f8a2dafd5631b81281c7a +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d2004e10d091fd7d159faac22bde80cee335729 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf7d09f010f88a8ea3157f3e7060ec09eec94f6014a936605e2d0f7d914c331 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b981b5d7f7f3737969135cb4cf456a447511b76 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a54d2e142f8abd4eaa7c7f4c30f37250712fb347af448bc69e431a3f5aeb6732 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c58bd977ab62670ce0df5de21d46b77e3fa58b9a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa12d928cc59ca55766dc69699b9297ee4fdec0e6a9e5b569a84f97fba3c973a +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c62beb04cc6cc81ed90515af327c7ae821d9fba --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceaed79440030422442b5d7610f6d05197ccabca26ecd4d3c54cb732f9b58ed3 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6be83011c780f86ba6e4f7ba755574fae9c6ac0b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e45509e9fb3d598ec588f9a6aac6b2905f1182f9fce213777979a898e5ea85d +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d120282df68ff97c9d6ff91efa2866cd3d94454 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a95550c7afb7dec2554f3dd9f53d49c332f817a0ab00caa2b954de0d02a151 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..629b24ac8c5cb99ac4e9a4938f020a3712190306 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b171ac3873bab601578bd05d8c1c91031460227ca3ba368228a08f3339da08b +size 199058914 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3716a8ce1b8305c15ac3ec74cfd1763ab08d0a61 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02e8d59e037d272ec4e967c46ed353ac2cbccaa2e28f30ce3aa08964cdd0703f +size 199058914 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb592893e1af598454bbc20b24f4fea003dfd763 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c5e564652fd343755f3784cc3f2fb9b3821d175a3eb943ec82157096fca1c3 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7422b95763e8119f6f1280c682d6e2512963d35 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ba6caa444a5fb7ecde354b29aa85314faf055b097a32d7861ae59ab5e5ebe8 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25131ac98d8e2a373112ad7f6f7672ad21013cbc --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd2037d30a025071b0faa62897854c1c3fbaf82b4dcbce4582c35e2d9bc36115 +size 199058711 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53b7d1fc8528d0c8e50ff0c1916af235e0c16ab1 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ffecbcf44308cee60bb0079a5807f3c0886d9f147f4c5d622cc4cc7ceaf5484 +size 199058711 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23b6746fe4c62e76c10eabd76090d971841f3c5a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e4d067cc3d66bfd86573f60b4d80b0b8cf140239b7c84a382e64196fcfd56a8 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..235c6116909d7013e0d4267c612c8b0e8f57190d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b609a7a23a0b639ec956b29a911323287c9bbf0430bdf6ff9fabfbbdfabaadde +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c342398cfaf5beba6a59322c480312bc7ce8241e --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53008e2645a7affe5932328bdcdc07a4f843810f5f7d9fb2987870aa44dd0ab5 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11287607923930f4a83e09fba2a1bb5b5a2839ff --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3f81a06c5fd3857baa5bc9ef957074fa8f3128efcbee2ed0f826cfaec2a7879 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96ac33f674307cebb551644b07d4b49b911e4cc7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66839fe120a8084814902ad82e9b822121cdc3e4f50a36398cee2bbce1ed1312 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d60dbf6cc61a4e1f914800f681ad40f54eefc67f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:020a51fb60b5c49b73ba834b319f7715d487da0e2ae4082e78d5af134a8a16df +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ec951106038eb548541f94a59b5cfd25f87765 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca5ee692dde0bd98437320b5d36cd88bf501466e88226d95fd6dea2081d2292f +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4558946ab0d26f7f20ab2fa9859a35d7a7f058e --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a50d02889a818b062c4aaf40d9f2ddeaf4afd31457c620979dbba726f62a30 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4310b243c10f07198eccd5d888ce0e069ada3481 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fcaf47c63fb0b1f9b4bc7decf40ad006cb545f59ed69de68049474d9bb2e868 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b864707624eacb6bab30803ecbc954555f6e60aa --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee8ef6ad11cfca68350e0ab241135f631c4d8bf10221c1fbe2817a458444de47 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aa83bb1d419d6240c077f6f1e2b25386f155206 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eadcc71cc5711c3c37c9174ee217455666d4694b37d79bd0b3c134c82c461ecc +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4365428b3d6ca6f856ca2715965c553bfc3dbf5 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb7e50fecb3fec0f6c650efd85c4cab7f3720c978b1272d38ded4855fdde808b +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..157374d009fa3bca01e02cb17722d221cad7fa59 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:101730cc1330ab49b43a245549b13b3da459f0cdbe6e33fd85713a7525637595 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..061ad2ff9f71d2e86968b72d196c47af56b465b3 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9788764e4e690a5f049ebfe59bfd8078e71b40aa6bb3b36235a06349e966f0b8 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5509457b6c9156018cc0852988be5e9e031fde29 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0c15fbfe7b56a87b9f49c40e3189e5f7fd86fab7c237d4e3a8e62792d6f32bc +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..979c89603c450c51588d4dd264268b83416cfe31 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bafb1a217c2972c6c982dbb21af89dcbefa3ca48cbf37538590441ec1832a448 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc49fb060a82968c7ff10b2970670c48ef8ee536 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a3aa7dddd35a3ea85ce13686f3f0ff7444b4824c1386cacacb59d1acd804bc0 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc4bdaefcaa27e8310223424511b0cdfcbe15bd3 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cc81dc58210a5ecb3a3b36d9c61899a504128d01b852cec99ea0ca7535be227 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfe310a463a9e35acadf3687dfc73e419940f163 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1049b564d6460c1d5383a4ae6e51f1f763efa0692fb7e80b97c4ebce4c8fe742 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12ac1d4137523d13df40796865789c16fa5d6cb7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17303fd23a792d9cf8245358d6cba45cd20535578b47ab14d24c8dbd86c089ce +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c06488ae5db8e8e51f6f4d6d37039150b303ad6 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ab5d56a58f3582597b0bebbf929fdb7eb3cc4aa74b83f8b0dd9ee62faf744c8 +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..667a7faaf1493a63f26b7171298b73d1653ba0f6 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4968a78b8d13cbbbbb359040c52174fceec9dd2309a2f4585d8aee117e4960a7 +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1188b0f52d11d82352859178a6a820002d52d7d8 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7ee1cbbce1a539978e4de69924c00b65098eb1a367d1a36a871e24ff706205 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56de99796b74d6e43a8654394b3fe7ad72a863bf --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0b0e0d40a5a8ad2f03b3a47eb56aa352b5d0fca38fc5a7f14ced825cc4d7a71 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93721a1e064b1bd248e79a348e7b144da2b98959 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2a183abdaa120fb6bc009f9153eb07a44e3fa606d4bef712c97fffa7d9cfed +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42447124bf5342d92dfd994774bb63deb0df9a48 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f018e393d5ea338e8181cd64548b10fd2833bf8640c09ae2c6e63b6a1090bc11 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a01c30bb3965aa967bd6af11271be77cd33d4edd --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92b87555c7c45f7c1a230938aecace12ddf6fd0307399d86490487937c983c09 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adfaf58c764f34e933fed3b9d11238a83677fb13 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2bfb674df34e1d5e7b261eb3334f7e39abda83c0cc01faa1af9eedd4b5fb551 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eaf4c6f37c4eb1627d5f566c2ffc80771e91db2 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ffbfccc45cb1ca153356aadc9c2ad7e9996be4ba4713adb3aef6307f26edc1 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3982eb7310d28c2777cf4aee66ec96cd7c9868d8 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d247685496486cfac0c41c09cb57bd4f01aeca86e204b660fe99975f9461c0f3 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36535c0fb13ae06ca6129ce03b3bd346132778b7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0479d6ef797e5fa9e364b75bb989a4cb3351e3505da95aba2149561e531316eb +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bfb5cf89c1d5845d56c940ca6f494e8fe0db80d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:029ee9990aa43d907bad7795901735ad3bd59a8b26fdae82349ec8e4afd3d419 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3fb68c12ec38300edb893d8c878bf18c3de9514 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edcfbc3490f5924f570053be81c95c7bf2b6cd4b460af9c003c10dc21bcbaccd +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83431d349c022ed5bb9ff28671b76b9ab3d0c3e0 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bddfb1bafcb22daeac518d077b5410d8b0c10e4efe5568a5dfc4a21c1f80ac4b +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..630083a5a0c47ecdc203f61bf9d6b2ef24cb67ca --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7552ec581cfe1c3d6b2e527e6b3e68f04f18fec7df77e7ee9b71028ae7409335 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7c94fe4cb21fbc9e413f1440ebf44eb1c0925ba --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb972fe7da808e51a7aff8a46263bccb2865cd849dc572c60c3857d20328524 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34b9570e907105367e95987ebfb667d54e7d7b57 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:216b2da6c9a024b7898d6fabb875f59e8a5fecf8a9419e2c9682c6c6da7f6b51 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..863b2679744e3e0a9d7e767ee3ac2124a4cc046c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e44347482f958a6066e71d463dfccacdb55b3667c6d2d3272f21b6f5ffd0e0d +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29119dc049416bdb8e04bc5f91277daa566317c8 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5404b551e0590c76005587a620a59845dd5602e59d92520682ebbe976d6e9616 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fd3f746d3115ba7fb83ca2992f2963a1b427939 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:527dd6a9e4ca1916c76504de59d0fd87f20c9d96e18eb3ab5eb3449cd9b41aac +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ab0e5d45446063fda65bfa2c667a2ac2a78d895 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3095262a3603e6ec9391d7677f6d10a1791964c7184ae52b63daa31ebc9ffa7c +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2cde26814087fbba639351bc21eed1064ada474 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9e955de32b2f8450763bc8aff496c34f16feeb863e6bf37f0430a63db87acf0 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b45d189eb205b2ecc1019807a41815cef5ff86d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62a369cc25a00d2d20b6848c0b1f55af8aa6b2a6df000d8f034019add14c242 +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa797ab30c3fd48584b7231c2e6087ef6886d06a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d7e00609476b87012ba7cb1d4e1c4f39e411a2e1d637fca1a7186860fd3a1f6 +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..758f0c842d4b283f9966fda2489f3df4e55375f0 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cc2c38f9caf218773e1bcbcdb7ccedb322052f417dbce90fa6561b0f6b9b552 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7c1da92f820a749a8ea25c4d5cf53ac406a57eb --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab6ebe2f87b905bf1ebc9b6493335c0ab6271efd01597477ffcd7eb2c35a12b +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c756533e9e3082e2b560bb3c64161549d571aa67 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83248857ca0e3f6fe244cb6a1646a460370e99ecfc8671c27542c3956daefa8f +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0adf2f3494b59008aed3a84d2cb7986b7ae551a9 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4056592d0745277f7fc36b1ade0773c0d134ecefe6fcdf91e193066d7a734d5d +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b625eb36ecc32622b1a232ab33d0ae87ddef4647 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9c0e9e6ef4e8ff1d2331a862641d44665bae599078ed23140e24bcf1d0abd3 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0838624a7c539448fd647667733de884eec5f774 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42c6b5279ca79e2b98de341261dc42bf03af93db7f12241848b3233b1b3fc4b9 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36a01212f752b38e1d536f6a435e2d9b80864a4b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df35a1c5845ae539012964524060b5322080d7ab1dde93da65b0ac4529487754 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aed11d3bbb8961b1780faa9023dd2e4c3bfb7d73 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61065194cb87bbc00f716bdbfb8099ab2421f71ecb730e19f62971468f5947ef +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b381f9f1c43241c036813a8802dc98cf25a87ab8 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8b4ca9353109150ad1f06e9392e8e76c09912f65556ad1b9f22f8142effc9d +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43f506e2e2696402172356e0e3dfc9f7a0910432 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94d4cef587fe310a0ddcdb8d63df188bdc7256a86df20557afab2093339b7945 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90ecdc542b3a9c6daec31d942d4b1c07883f10f3 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7faa518c696d461d7b5ad5b9b0fb4c130acd34d789087f9183af055bf9f3d8b7 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30a4ccc461ba5ad2d7b0f3d8c0ee1b40a7571580 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f7725154fda867ce6400afe885d1e1cc17d91ee2616b8ddfcd0d65d807ec3d +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..355f5cee12a3323e56649de7271f4ae5460ff14d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71c6e99d7821ba8926408619258b51d8620f9baaffcc80e1437c9cb9de0e5d4c +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8d44e9451e1cd774e9f5422207b44064ba12e28 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3abe31ac6957f9730ebc8f54b94845ca16a9f2831d85d0cbfc8ac3b92967c50c +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45ec88f0acfae4e3094c8fe75915f3706ccb29ca --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95a16a3c27afcfd8d0a38605696f0d0a987bf0cbb7c692c5820716629ad1f26b +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed8a07b7de0a8faf71b0f86df71504012dd49fd3 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fda21388e3028e3204d364712b116800f6f4bd7c493007305916c25877d4cb1 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86f2b5e062a341dd9d2290ee06f255552858fc29 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27f74937b10050ccbb030b61080d8ada199bc9b840e7fba890e68157aa5f57af +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..280f9cdcda8445efd1b7549bebd3ffa0e9aed03f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2881b42b8fd826cb87824b331140c26040d06ef2f14f79b57a225dc7aa8f3efa +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63b0ccc5f802e042d1f0810b3e3a4db85b6cf092 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e81cbd49a7d4198970534d793660cae6cde124a4211f6cfd8254783a3a2c307 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b64836abf6207ad32816d3ebc03bfa0f1b10bcb --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bd9138efc103cc5580b23ccebca9eefd4d3493caaf9d3e320e9be52d7120676 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e01930ac520b51bd0b14c4ade191d228a466755b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:595398c1e4114346a4337042142cad4daca44ce6d84d330ab7247650bd5346df +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f28dcba599278639ef2d4b925aa89450f67bdce0 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72adcb4e8b3aaeada18fa527ce7bd037123567cdb70e292046c3c5d57b16426e +size 199058647 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b561eee463230710f6fc8035cd5f3e83f1629859 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c45e30da3ba660de22cfd792e5ac4713957b7a2f8ce5984a2b5a5e57f71ce42c +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6b789d388b140cb1eb247ee22913ea700d4b88e --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26423ecf134c1f7d113b02d2ac4dc36e53f7c9848073a771659dac9ed558f420 +size 199058850 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3c07608c1cc83c24894399e9569e1c538d0c584 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc4ec71c12b5ebe422b6abb0771266eecd8abb97cc9980b8297301e091df8cc9 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31cb0ef3b501e4b392ed484b6a9dd6b9db8a102c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:681cb12fbb314a797c636c777837a4db3978c8e4ab3bde3f92f5ae214be13af5 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dba07b940670b92fdfbb2c1c0d9731cddfd14d0c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a58bcd47634642560392924665b06964b3c17f3f5d81400ea2b8c1238354a45d +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d068aa258fd146b0004e60c442ea56c6e24e4120 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050ceb8ef8aab2bfcbe0173c09e30718a417713d434099fc51305fad58a29682 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80cd991a4c120a515a8e1c72db7f630ef153e87b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56cfe32068266e3fe2f34276a2442e00db47e5269960b35529b2ab258df2992 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8f243093a783e0734b4fe1163f803e5c96ca934 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38a82e7f3c13c776621813247c208286304b8fc12eef84a5bb4b244c26780ca1 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3401681c48323fe39bab801eedd02b926063f60a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9de6157dfdcc2d3b809bde1c841c3a5ab5ab3d5618d999f948b9775f0a4220c9 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e560b00e1457123fed6cec47880b5dd165021bd --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9b24cd8066f71b517c2821ce59ef526de1da63317c7c1e148822039b41a4dfd +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5549830a2cf8a7bd7d4ac4da9241c475bc30d824 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:749dda4de4168cf41194193ac3ef77351b9ee41f86ea3ad5231e386dac1d9119 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cf7d862f212c6694249651eb29c40fe24aebd3f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac7aad554ae265b6582547a1621c969bb1959deff1b4cba4756bf645e7ba0fbd +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55fc19f1d1683d8cdfe0903f349e7ec0c599867a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039351ff8e5656d604837efeb8528ea6bdb878147bd2f3873f30dd4804a0b13b +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49ab5c026e13516a602d9e4d6b79621bd8829e5b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c37727958180fa830d51dfa10f4cdad71dc94f0ead06870a9b02b161d6af56 +size 199058722 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1aa36f175e4950e840a60bc0e5cbb79efd447710 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71091b542fbfce32b219229aa141169ebcb40a6dd2148550445eae5b5e471c67 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b67a84dbcd497ea28a5b9377ab0dac266a2cf6f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bab91a8f763e52385eb323edc5e41110b229026198f1b13edf072acaf074eb70 +size 199058786 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a25fb225de3c62e55b9d528ddd099083e9ecf28 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86ca30156b4be3f0d84f01f4103ba36a95a8faa59af6ff1c1cd7fafc058db960 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd4bae679e4380853c12b375638b31102c0ce851 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a41f8adc009f47fe73da05c29210a4b55d02613564525109ca3cd5348d14757a +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..251ac63f34c2d63fcc88d308d469c6d5d84e2546 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e0eabcba2c75efb020b9cda6a974d703118a69e47c4723e0a715bb2e1adb497 +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03d0cb353b1b5df4ee791f6427debdf9a583a4f7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7bd7e224f673c54c6a4e47093a7fe2e965fc7669c481c5074c1b9916ab09eed +size 199058658 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ee0a5dac7a2461b01b04cd1cdbee7f66d6d38ac --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2afac49b03c2256ed4cb70f6b3b6d0b7f59bb274a2dc3c0d130ef6490d13e18 +size 199058839 diff --git a/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ffbd70eeabcb1cba551b76752239c207d45794b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ed79f865df9a577143f1cbb4b1972d543826224edca22bca40b791c717c2c12 +size 199058839 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_01-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..317122b51a882725c41addccd2f7e0e1aea84c84 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71bda5188dd1913d4a3166aecbb4e227eb50e5cb8a4684297b98623a24efad95 +size 167511299 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_01-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d336c92312cf1158a67b3fcf2848c9c4c5606741 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9445912011231e1f93d83344489718d5b9ec9e1af87c061575236fd0c061a9af +size 167511299 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_03-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bfb5237c23f678bc00a5d3847ecdf67bb54502f --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:842280f7d82f22ad0af979e2cbb6e7914e3f3993d3df0baad1aae6fa884c2f92 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_03-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16af7a2149d33a8419ccd25f603b3fc7f97a30f0 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1a361ebf72b1402e5ab37f4eddcd14437809d90b8f59b1e3847cdf9cf212632 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_04-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c028c44d013230ac55303e36837bcafcb280554d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ff8427a8bf5c7dc21d7c44b4a7a8a1dfccb3225d08924900418e5c40cc74299 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_04-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68b9aa72165ec7a793844bd7216b2e513a70ac70 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a17f4c24c21d7818d9b4b34dc7874a1ea8e43ad5b35bba2700c142ceb4fb6af +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_05-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d47bfdb8c57f1d4f8b8958451519620eda43373 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:866b742ad2d291e3b95cb19e9e8cad42c0df053bb07e994032600f40ca514cda +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_05-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34573e695182b5393107a35531629c3b27f82372 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c44485ad2ee5f6ae1fea91d19fbfe0c33574231911c236cde3f0348a03f3a88f +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_06-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f8fee502a78a3d75e349d991b861dfa0b6924fd --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071903d20ff4b34765213ff17142b5b7ede773885a3dc6bbe92daa7384ea3c02 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_06-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c560660d093a76dd8092a8ab4e308678c2a82098 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82b3697745b9171c705ddb9242a3a96f3afb032c888ad9793ad6f986bae01d22 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_07-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1ff79242df2a14ea0330b2a4a18c53c3f67683b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbf23be36c7284e7ab375bf6cb45bdf383ae54554b843241024c6cf9aad560ec +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_07-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15f87fd982feecf1f6fccf701c3389179f48b200 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe47e88d5b949f53124d3b508a43d7d2ed0455631fc1d3b71c315c149a1cd0fb +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_08-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..340619b0e4653a7ef40522b530f90dbad1fdedbe --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea7362f48eb310a6171aee2799a70b2b72a2ae94cecd9c17373dbd8141343cb +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_08-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..629dee37b13be68a1b8854238931cefa98bfa7ab --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4c4e3f6a4f5b8744e49a501ddeb77f5368cd1b8f265f0b36e4232a0f969a425 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_09-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfaf8aee8e210c4d8c9f67776b6408d4742196d5 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f915c7e5f64763d622f4d0c3d0bd9e327cfc2c699517321b122f9aa1d25ef88 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_09-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8865de888e0725a1719db307e1a6ca42d3b02695 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b15fc0566b5bc9c60d48b5f6b29e8585c440dc4dcf5b8cd5df87acd43d27954 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_10-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b4de7472ec62d14187568a1e2bfcdee96179d4b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc05a30d45233ba58f88d0461f5d7ec4cfdb26fc239ad14b005e3603140e56ae +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_10-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b59e3b834a502aef29ac0b931ca857a0c5e93f05 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25dfb5ef7abb118c549b341cb256dacbfa9362fc91526e29f4fae05cabb3b897 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_11-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99c25e0f713049f947cad7b3c69bbb95ba5572b8 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c5b0a920dbb4e21758fe357aa13f49cae7cde0862831f3c36b741ef128055be +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_11-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..769a784c63d55836105057e99c91445f8a8f3f1d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:163be9c0b3255693ba677e1d9e36ea7dba119a7c9cbe9e946b071521ae9a2fa4 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_12-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaf718217d89e8e2b64ac9767184dc525a6305ba --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:808f39d5962d678adc0a7e2e56177c75cfd6d54d194aa5c391ca5a60a44f571d +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_12-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b56122e552556352e3d90defbf6bdde792490bcc --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9134e8da1b19f417d9d63563271b76d3fd3760e7319f01d25f1acf703deb8557 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_13-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17464519325d889a85ef6ca78f12a21b4afec38b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1af20c2a8491450a6bb256159180aafccdf7ad552a8c4783150a2706cca5681e +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_13-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6fdd283a4c90aabf3deba4c29946f9f9d2740ca --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1056adca8b7db56b1e02acc8827c6f7541a567c68c94b50b0b5172698d21a77 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_14-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca30ef4ee8e2a4ccc10ae7f4c657f2cf87416cb6 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:475e030ac97db75eff8f2dffb0c968080771b5d828f2deddab21c22453aec197 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_14-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e28da8de0f9b02f7db35cf65470770807e8af56 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:016f47032c42a3daaea2af2747effc2c22be1dab133894642e0c19c4da3b0df6 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_15-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2ad36d1c3b63bdefa7cfde973db17f5184ca9c3 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae56b4e72b05d1ea629e05f6cfe3eb114f4d39c7f1fe645edfa40b8288c202b9 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_15-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bf7c8204bf757c33e0d48d5817de5ab3c1ea220 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50938c37a3872245e116c7ef9a7bde21fa033bb28cc4d216f74191736a485b55 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_16-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a22d0c6fc79aca8d08f2a886647bc3cc7d10b2 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7f87a7ac6668a0721b2f4460e14de71db37e375452ab81619858ae478abe053 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_16-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e13fa6a3caad254d5a604423e6fda6384cdd972 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a46b2b27a33e3d3e41be8887e39ad430ce152b161a9cb070c03925df7bafe714 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_17-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d2cac78be00b7c7caea5e45f69f72eb78ac1f7c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a90d476db516edc9f12a94654bf07014e99796150513efd73eaa11f1a96eaf1a +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_17-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8ec1aec4f4d976bea256c5222b44f207cb4d6c9 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d1a0ef4dcce750e1bb855c0025ea8d2f4ba8e1aa896761e08304f4b9b12fda7 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_18-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c04769d8d5b15ac22d6bc4863ce30d0a99620a7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941c252c45df264e286c1cd7a66cdb1bec019886f09b9b7b8933f77f3dead6d9 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_18-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2107bea3a81bab75d6b332ab9285f7ae1cf7c05 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceaea5c7aeb012f16737d7080efd11a96136f204971fa6dcedb8d5bc0a3d2565 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_19-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..055ece28014b276f8a6312a40ba45509a0997cfe --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ac02069131f3fa419c055a9640d09f9172c901d591bd310340e00ead5a334c +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_19-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccc6cac41cad53c750c215a1df0efb2719b39243 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c80faf9bbe8e6ea35a7ba47029944574bdedfeda7af946b73ff0b502b6e6216 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_20-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bc17fbb60cac9658ba1db89976d1170b84b40af --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14c99ec475838d6e61f4bb241306126f5bf141b580ab38ab7ac5916f1a5399eb +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_20-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..227ba029fe143077a87f7ba976a8d0a13dc07609 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90432a9568186c051d58d22f02a2de5c8917d003e17a062cae94a85e459797ae +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_21-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07c0d149dd02742c2d93de6f3f778bc73cee5131 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12ff54efeade24931079c847c0cc9d89ce7a19929403eff7e0f0f7264912b548 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_21-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc007e0776b02b9c98fedf5bb5dee8ac92fcbbb4 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb0cc427ed073091269e7d66cd53efd2a78825a784620437036b73cf2e303e9 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_22-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efd3cf700e28620fe0add4ca8f0d6b6d59a1fea5 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec13ab46fe587fa95fa692c9a028230368d993db4e2c540d259e198f403d9275 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_22-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6f50a00d9b2b9ed74648e7c0355bec0fcc0c977 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db2212263ff3fb7d4ad9602bc35a16e226f3efb0adea50cd5c90c60ff4ef8005 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_23-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcdaad932081e893d5d4c3aae9418448afe98ea3 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7b612cf252103146280727d2a33bd932b36b71a39a5497526d1f8675d72438 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_23-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca7935276a5513116d52091422549c9c2988148a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246d4117b55864fcd4121f35c61418565de7446a165501f310b7c683904b51df +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_24-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86712b1b2d6525fe9e4048b1ad30b95577e843e8 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53aa30dbcf340dd37a2b54e8844ef8b0fe15a80604fbe41c236da2faca13d318 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_24-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1854d2b1a71a25baf751920d7d56da098326b25a --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbec91c29763518cf03c8513dd187f317b59814f2cea8ad76a0ebc0b528a64e9 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_25-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd84e79b28797b271b691d826f6ce725653f42f7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d55b926ecfe9e43b9c956720f7072c5db873e659ed56fdc120c6df4501e93469 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_25-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53a8630522dec4821ddce7a11b75d12d8acab6e5 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c8eb813c17a1719163b6f7f030d0491b52141dbb237b2ea7b1e76c714660ed +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_26-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3825adee59a942417afb41fae9bf9873aba80843 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9db784eadbff7835f2188bfe2ec130db25097dc8593f24c1097a5093444201d +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_26-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..007c2c7582e444dd9ac54dff79539ef4352fa1a2 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1f4f8519df47ada44dbe6746a165e243dd880a057c4d4c0236fee0da4031968 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_27-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f441e81bfd7196b73afa1e060b9aafaa236a78b7 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c8ec8319b7930d10f8e0472ac8abd93118afda5038c3867c1ec6317d584ec6 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_27-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41a8d5849173791b4f47039de7b2c4deb3a27fea --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621f87490c7f7561c564d726d288b6ce835174ce921cbbe9d7b5b2d0aa7845f8 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_28-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8853e3b2a60d71c430f4e9b811dd4804e7496d54 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17d7429f75d3d3894dbe96000e2e2b2fbb092e6b42ba977d4f4f723faf8cdd2b +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_28-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9a44275fa1c81a601b9ea7ad24de240a4825737 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e6212d8ec4a25b947ef6c2420e63ae350b69ffa0551b1f920b8fdf5b0a542f +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_29-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06315ce359431c90e1aa270fec79cbc49c035ce9 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cee6454a6c87c030c4cb731052c397c7ea834515e172f345339943260f96073 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_29-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f891648f1d6eb63438aa1ba5bd2d4d464ed00fc2 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f90fbf1621c3ccfc1c08064f5f7dfc1ad88b2ea7056fc8ed453062203eeaca6a +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_30-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8bb693c805bf4452bfa3933f2ed9b09b22369a0 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d6848ced9314841cc1154ab8f7c6f741370bfeb1e4e51249bbf2e5cf01cc8a6 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_30-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bb3aae356754fee88e161cd06a9d8be16c82401 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b2fba63aed07a4b4a4bbfd29b0bb2f8e628fc8d5ffe16e2943622b05200a62a +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_31-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c9b5bedfcdc9659a1297b881b01d35ad2931638 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7a6b905d5bbb79197158a69c14cf05ce6875d02e75007a9772d4b9973f24294 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_31-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f51a178951cc9c2cd4dc84951d759a316e8dbfc3 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f77897c94cd8b324b942239ac76aa8ad340e154efde664d96fb3f74bb75f0a2 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_32-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3c05d75a60d75f2c427223e14fbc35c326c509d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf54bef9eee2cde959ff99d372bf79652524df995ac571c871b815a20dbb77bc +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_32-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf03d6aae015ec48f656f15c8a299b895e464a44 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcd0fdc7a56b1e2e06da42f5ebf6f501d5c70e6ccf93ba518ffff1dba2901f83 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_33-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1d44afc90e7fc42dde4b6d7434b12112bae36d1 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdd93208aff5ea2e55c33dae4f38cabf94968e9e44409badd6528985ae7b2b94 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_33-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a78a142f330cb93fd91e4bebfdd9a0cc31ce2ef --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:734e038b87116ec9a0533971ed488b2c7db4bfd37bad368ae7896c9304a993e8 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_34-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3d60ce7dc1aaf9f994bbc1a5d293a5356239140 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d10b3c3b3bc370ad2a8a9f383c6c4e9f7361e5ce5540c70d6c9406424d3e1a90 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_34-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a048cb62f5bf6d3236688a37b3cf9c4c50aeba92 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf8bafd25df065e606a3292e43a16b6a659a08e4e9443c314a1ef5349346c785 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_35-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1068cab18da9ad2d69a8af45b4c64ddc57404a69 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b54f143b5b1697ba8706522cbb17e654080c883068c65a8f012c4282ac28242f +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_35-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7c867f0759045c9bc929972ab07b52c24eaf751 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6d1ed74779df21713676efc9d6e773f675265dff80cb4dd68db4c7ef50b4087 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_36-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22c333cd83c7cb9c1458ffdd20e961eb38799417 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08fee94c8a9493f4bfd3a2ea261b390a9cc406940e5a97d59cc7ea305986fee9 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_36-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9674580ac6ae2748fdce13ddcbb051e57d19c695 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae0cfccf47a537d404292a9d1f393830c268e164bfdda6d9b5573c1dea768cfd +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_37-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..700cbced54e3388ec2f4a095eab3d1f5795b567b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e683b51a0ba6c64d584e82c36197e13edee2ba6f26437586d9407335727a1458 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_37-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39f0a4c119b8223e82b9fc51734d11064bfad19d --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14d89b7212355baa1f68d4e57a333169ab5237258979d60cdff658d5ddbc612d +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_38-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4684281302d52304be510181621d9d253683c49 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29ef9b100452863e5c5d5d8a361ed42f2fdc30b85bb2e7d0cbe21ecf7887dada +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_38-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae99af8ac762592d2f05fe0b7ef9c20cf1d9d103 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77891e55cae2ccfaef92f4b8122fa0466095c35a7955b433e9be252f2c31ef08 +size 113308931 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_40-model_00-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31f75ab2b5a09b439e7c5e0cf20f8a63ba31a789 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4cf3d0ed15c02a4c64fc37f23aa04133e2b830dfd47bcdf6733e0c1633e989 +size 13507 diff --git a/4b284b84bc4v2seed2/global_step80108/layer_40-model_01-model_states.pt b/4b284b84bc4v2seed2/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8deac7eb458babceb9fd795c6a60f1168f9452b --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d92b375e320fa073d16c8cb0ffaeae0350134d1b552b2ec61c3fa49eea790262 +size 13507 diff --git a/4b284b84bc4v2seed2/global_step80108/mp_rank_00_model_states.pt b/4b284b84bc4v2seed2/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fea88589f72434a9ed7d1534c0b35d7743fc6c36 --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b81f837e67279b92e0b4181c85fccce8d6c388e017068b255a2fa151edf5aba +size 51443 diff --git a/4b284b84bc4v2seed2/global_step80108/mp_rank_01_model_states.pt b/4b284b84bc4v2seed2/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6940932d0cca8dd68e153611076d6340fc6a8a4c --- /dev/null +++ b/4b284b84bc4v2seed2/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7728265d048641e1eb446989df6745454a84ffe1dc06ccd10cc531139f405b00 +size 51443 diff --git a/4b284b84bc4v2seed2/transformers/config.json b/4b284b84bc4v2seed2/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b84bc4v2seed2/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b84bc4v2seed2/transformers/pytorch_model.bin b/4b284b84bc4v2seed2/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ce54a30eb762d7ae97e7a506796038278258ce9 --- /dev/null +++ b/4b284b84bc4v2seed2/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c637981827c59373903a5af1066ea5dab49f86731d33967942fd8b0a45e8e144 +size 8781203669 diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d01e2a393761b36a43bcbbc29836ca75081949d5 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.33698931558059864, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03520091082802491}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06832528700117271, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002020031616020774}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.24924535874354928, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004710667742123965}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09682464818590401, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021746201526808115}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.031623603705718525, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010704082391642267}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.12321043440007193, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0031299036359367484}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04638572157936821, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013302529021085698}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06503251084712686, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018228814683563853}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.242120358957363, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0045711852361007615}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09281887400756049, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001998996594014213}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06504280718043812, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018744892527656203}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.23925679819243256, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004467359403537819}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09242326380243195, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002033441173958409}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..b40590e2f060191d33ec44b240418fc06c22b2d6 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.50071840910503, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04570119173979742}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07262405538535584, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015025709069587576}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3545200580306086, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005274328693296472}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11243638843069366, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020002359883771006}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03411790558117329, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009146851141661013}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1735824312348198, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036281888114770787}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.052828679189574415, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012458061281784743}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06858742604428675, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013499175148544084}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.33533941614782714, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00489862350776037}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10640900334612001, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018168238044968257}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06889204707695668, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014115064627086959}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3353795561043291, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0048767168213307635}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10662100746126313, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018761173400960428}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..22499ab7a72acfdeabf661dd25d5947f9add7eb8 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5940498197237445, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.045360168270571564}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07459577331672164, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001595194413101619}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38907556546905864, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0054304691316662745}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11593737527731507, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001949513588062909}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.035114673270987544, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010081353981524028}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19584375989737013, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004008082321996039}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05449451670049787, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012399615319130626}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06931044734650851, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001428917200995628}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35996374778547313, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0049025475018146785}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10783733998051759, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017619447024028836}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07079493663216743, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015053431740885688}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3670729702378272, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00501564179221856}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10992722332009006, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018365522736996146}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e8188cac0ce0f2a11e582c1f2f880e8801c48603 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6360838559544998, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03653875799485711}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07236011578940099, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013910988503604417}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3928435128894812, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005384069245593369}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11355856417583833, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017735693070030508}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.033363396708401855, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000803140401456714}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19915667523109754, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004011860806625624}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05302505138393545, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011266752102525668}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06687767191203486, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012600410796976124}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3592559338816392, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0047582409926964905}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1048768596135265, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016046493945327915}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0682810245315365, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013111163093307867}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3687377662903542, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004960565943300161}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10707993411906895, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016657550135363104}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..040db93aeb8941a65221717df873b7f9a23d8989 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7027350329668681, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0419156836814436}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07411348564826069, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012900003957059321}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40994918124441987, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005364326251363318}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11781335466174786, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017761239549537581}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03434960773754005, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007831150259881873}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20756196914680475, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004035186327369416}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05494234282461018, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001125668640595295}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06799320620725614, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011446709666944061}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37268673451611783, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0047156874564148465}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10796130107897399, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015796761570714324}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07001046072193005, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012147694362971294}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.38481667508014805, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0049365819422690195}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11115469880289687, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001670218626963014}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b0ca0e6adc23664390cd0816f1bff66fd0dc31a8 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7868609033139111, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.040304136105284674}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07559215659324663, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013368561782119886}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4322159752184723, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005507418892615091}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12053057909919479, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017893350216202717}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03531136059294999, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008350132401271129}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.22153138326278524, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004197864843142094}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05660554273746949, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011398496071974332}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0683868166969706, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011383097189411916}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.387608398091316, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004759866077492818}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1089770281372542, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015496587154532736}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07105854805056085, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012600458442573047}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.40338460571037565, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005019831598860692}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11313127630281221, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016759508017601735}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..19a800614d90ec46f65e99a8a68f606fe3e814f3 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14983850803367624, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018751672389164477}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2550580803178272, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027794243641439476}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1749169386171503, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018652551820908833}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.030382874922609843, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007519667664767079}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.054505775605249815, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014473521383030284}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.035914103574269995, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008571739488027627}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11682287834978397, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013372228496992414}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.20560214095840312, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022848479838345685}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13780562967661653, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001358236237017717}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13742857779903467, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017113854895127892}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23501911131597872, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025756220873118974}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16059954854119637, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017011067980149748}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5100556841549206, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.056240452574111845}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1d35030676958cc641a2c659c705d720933d8f6b --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1965390881322699, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022899400776314653}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.3206094100455321, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002849589854137116}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22285165404429813, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019735517320632746}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05045558070635316, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011660432710824278}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08246262292072058, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017565984624132588}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.056001917384198796, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010665112573503633}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13895822267839106, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016253397048819503}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23337530287957864, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022628070507281664}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15830852566063647, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013457659853471373}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18479852886338183, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021643241999535143}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.3019972782519105, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002703215847122071}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.20945729941888908, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018462891651681006}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.965142818939576, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06637064806778528}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..69d518dfe198bfd67a236b337b004a946a277b48 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.20155746658889173, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023374350511286197}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.3173353129081016, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002820895911494938}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.2236964233973595, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019023763735918212}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05269972304999503, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001197033866295586}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08395356718136517, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017436680982696616}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05753113933914173, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010826117471515486}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.14470120145484863, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017283958163244364}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.233378725309496, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023004114225280213}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.16108340919074526, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001357852843091288}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.19006446021144513, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002218603404878938}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.30023601631924435, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002704859202966948}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.21101035224845988, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001793590665001926}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.092360521821163, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08937218000390199}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1d6f4fed8ccf992b00856631a07799e509aa1b22 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.17379375635824176, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026246110896642268}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2638936090552038, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003388128200410466}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1865213351213735, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022753171506905965}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04282623790563042, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011568698796170502}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06755023246625483, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016980876475847096}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04592788875910395, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010286025903021396}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12470876767206059, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00198989611192214}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1925552246827813, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0026451539087018585}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13306544091830314, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015985646389652382}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1641047927743934, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024936634430607935}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24985286020591305, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032309944265283695}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1760787377574676, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021410940507585008}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.9732444729240193, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09147492615114675}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..bb3d48d95f985233d0868848538d1375ba8e7ec5 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.059448771232523664, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002218569421407597}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08822441141978317, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003020915797584135}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.0605919538076038, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020099409218817697}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.014949718004119315, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008976901887326936}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.02428038352612278, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001276025523659211}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.015593229425275027, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007474058630918573}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.0446701681314208, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017283868647508462}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06670046801956148, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002362351165144592}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04486687523926569, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014834001600610909}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.056074265222838884, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020960296913534976}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.08343237936875103, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00287322955407947}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.057104894137255724, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018950436973998253}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.6533679656816203, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04947451807737188}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a893aa760117f39b7f35a9ca36ac5f8c086a0044 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.009348211882001287, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009832878517389112}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.013688335464355616, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013308943056046898}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.00929579656840014, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008648371348177522}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.002530983918335585, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00045036458463964445}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.00396277708838197, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0005637401793403029}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002384610836596322, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00028677749720556095}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.007189697647068899, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0008082293363466722}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010450449827034726, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010632636910403864}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006964849797303445, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006505850643049141}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.008774341101660414, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0009302597680921362}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.012985553018433522, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.001276501870842985}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008747681514956059, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008159791184455816}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 4.1457161238536384e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 9.147191188223124e-07}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..37b468f63b7774a681b569837ae470b2ee538e35 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.37083773151234173, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.023770267793187624}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.06608746744853429, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0006810687592344808}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.14195087368704973, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0012610802186243078}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.08851879719705498, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008401305153826185}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.0034258087224012515, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00032514807417983457}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.00704033391818721, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0006361810577325418}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.0045379311452906496, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00042315898801261495}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.06585617168656571, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006670941024074856}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.14144906524240433, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0012314615868737277}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.08820722536535333, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0008208954817151469}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.05497072058739539, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0005636175471074675}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.11929179350942047, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0010831868664373235}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.07382731521584816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0006992840645883968}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cd594482735765cbc2383c54f21b211f66f3e591 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.210308239038657, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13532926187041483}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5337134369290545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0033441618301280323}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4186112103011673, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003029511762554002}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.44364097425563637, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024213391823928623}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2503358019053269, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025907821242386786}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19267261882751974, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002098816040806122}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.20464247864479315, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019524189816088483}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3856908650245338, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002931334041050201}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2989387799212162, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024147108908862333}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3179154131738048, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002060565311895604}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4329536166939937, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031784168539919287}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.33757778280843753, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027140890148101187}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35856203407161186, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023230420120309756}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..62334524f0ec589dcff94b031d4088750b2e6b33 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.855010359789356, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1433052434909132}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5659453062773773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003270807439335411}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4426574876800998, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002892096018797496}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4715984211104789, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002279297442582234}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.27838189797515667, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002671533749085893}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21363966698505715, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021189348260758872}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22811726769856144, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019828962661021204}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4103597152277875, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002911142472749296}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.319223478072641, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023906932022469385}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3403464767676166, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020236690372816674}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.461695670382684, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031155745746790013}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.36069384550050293, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002666755684059944}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38431431509550784, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022508604583330134}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d940d8ee8d45c9ed74c40389d8101f909a17602e --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.64156249802983, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15061545188803951}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5750153314520224, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031859723554921284}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4510440289695527, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028677830005739494}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.48080915530796386, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002234979483832272}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.28884561820039295, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002639498857757876}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22357397871649595, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022043371695741783}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23831207673207944, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002020312344935205}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4195446580367559, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029133142431469273}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3276080175727646, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024527144670301914}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3492803919842545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020660644514658923}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4727009044140323, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031160796738222674}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.37055635583114344, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027125904536736854}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39480073772752605, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022686218848066435}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..36262befbd016bb4db307754e2b8d2bfe68f5d93 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.48978762764689, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18010374224713105}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5783755973364397, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003188421667895018}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4521748484155905, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028320142916950963}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.48299936414020656, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021956091228780565}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2905353846413916, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026426279354766213}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22353380032103162, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021373490578138086}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23895749463268698, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00196124259284921}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4173159956369907, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029141064950507158}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3255911950461323, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024733626405686934}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.347484945544206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002079636990372097}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4733193294500394, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003118544106260605}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3704278657572045, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027237053634839347}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3952584823764592, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00227735538013133}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..025a655d7b92d91b419711154525d7462544a2cb --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.585319575612113, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15871453640685637}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5799683476103964, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031994912520596636}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.45706214916858773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002844413918683844}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.48786585090169554, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00223672743807504}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.29236226184175695, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026385490403355457}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22695605327657692, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021727413185400174}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.24237216469601944, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019981286651549568}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4148253441054077, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00283534958682861}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32700945528721864, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002473535129442898}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34850083462923376, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002084486638424466}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4734672508470655, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030825263814209243}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.37359433682039755, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027168498928153875}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39837100157486816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002290117281740733}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c659975e755c4b7b9bed049448ab7f8a3fbd43ff --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.16876091355105496, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002428477465457079}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3341076035740682, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0046048681292224745}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2136631527247442, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026638229066998256}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03747194366522528, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014955773574022288}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07911851428210626, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002822698047160193}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04856213249829562, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017561436649774235}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1271557431168007, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019539789800342004}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25284226031166046, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0036682449427253147}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1610160340198798, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021142466349326873}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.13217520866885155, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002071100870900028}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26428103009111936, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004079358230845003}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16787123550272315, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023335572634387495}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.1113783413326344, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11912014552832849}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cb3aa915432261379606ea2648cb09c3b709af6a --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12927526554265445, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018265553859337874}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3185510498370038, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004229864775990553}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.18170879656881125, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00245218614539981}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02602935902165096, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001023224048321341}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06652536681300213, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002722006503197127}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03694944789541673, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001451072652969939}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09989029850197624, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013879057374961837}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2479107129331233, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003381030448367971}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14062720750461896, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018793551451232017}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10341765201003357, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015149831274551388}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2571991639086138, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003711770412976227}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14570314466301257, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002064223760081791}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4807516008262442, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10561063787286398}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a3f8b7e96ad90510674e76507377fbffe80fe1f6 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13145946154632493, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018544974879548131}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.32387324210035007, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004267761663343424}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1847484789507431, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024906095591687542}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02808308652134632, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010347320981807847}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07187873077263424, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027472238907884166}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03989446165864525, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001470552354617615}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1019161886732123, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001391499897049356}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2535896765342832, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034183375598958493}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14356843077788037, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018927425748884437}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10460558980438973, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015202856124887812}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2605683575765448, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037100189499078345}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14741895358409335, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020743741796644924}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.6562203262313626, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07982304015370187}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..04446cc07b38fbb10261f4f0f9f826693ef7da3c --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13318228571463592, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020455353549147103}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.317018855215892, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004518876538639268}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.18390048441125048, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026657496989706104}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.028785220783836416, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010625475528616283}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07136621731857556, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026618058930387434}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.040350616115479146, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014683337326124046}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10172139078346341, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015298521300718705}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2445625759480037, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003569632794081247}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14086692618233734, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020271972409091304}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10639989816115737, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016639989017194455}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.255751047100679, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0038734069167402317}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14729860857759783, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002200650446133668}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.7657291524477807, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11405030461208435}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..66a4e78d4c6e71237fda5db3391b928fa5bb9bf0 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0415260420063545, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026056508945012298}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07757055211542944, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004506312599731837}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04858562888319941, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0027184130065024178}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0074966026006513965, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006746135809758764}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0173613412544955, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015976731193386722}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.009949994948206649, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008716091074829112}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03194572657523972, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002158988118941094}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.05898387332591097, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003484814745152857}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.036593331243362004, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020450096289478343}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.033578484743865225, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002237487835101602}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.06211470890687305, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036822940469355132}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0385888024512549, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002163672046764109}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7368905267923197, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10568292014256596}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..2cbfdae1cf13c46064b95ad260a8e4ba19d5d8e6 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/agg.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0029927391798704375, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008124604444580753}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.002590023053043221, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0006974154226908588}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0027194147089883844, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007296230437372524}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.000247284899936924, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00011058519545078262}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00019440465195182176, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 8.882271405728297e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00021508550838189274, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 9.668205684028845e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.002007763097414947, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005311869704827251}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0017507054146174415, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0004724443085314579}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0018356640850194482, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0004879741431962152}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0022522452753482606, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0006086895267107963}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0020127265562168294, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0005598466140344547}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0020761523840976182, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005629570167031783}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4041260567643717e-38, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.3322404897773207e-33}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d5f7ba36e27541b82ad2bfc939cb6acfa6529e80 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dfffea28de0dce740c616d3ea36cde512c367bdeec33ae0669ca11f1b41873b +size 4063199 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e80cc641c258e6f6ed42f36db5b5fead966b77fd --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:837b68ee10345fa2eb2c743defc158997decfc0767e3b1bade5607a86ba091fc +size 5108680 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8d2c4eab8f7f7b2ba38bf2364bbe87833c49fe1b --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bbb0db2c4c5d75d0d054e17af9a0ed151190c4d9c81a4edbe00030318890bc5 +size 6047187 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b365505028656634dceaaa7b252734e970e64cab --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3118a978cb4115021e0b178800515dce6a9b128f0f91ba71bbca0d188d48740c +size 6977209 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cdc2af130aeda253cca6dbb56e649ceb37f251cb --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87d8b735d8967c389df334a08f955ccf233b1bdcbc004faaf19398cc54f6038f +size 7881728 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..87ada49ec6a2dccf391953b92e42b66385e9b43a --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a91cf03c20b593af58f2159d800f87904fbd4d18fbac4d1ead91c72958f60a7 +size 8811603 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7e9392b6f79d44b84af631f6b6907014925811bb --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:340268481d81817e226cb97f609d344385d0a87e6ac4443bfb8a80d148db732b +size 7686779 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..33b9956b61aa5ed8fbe40c6b079c81539989c974 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1ab377890b38b35dc5a5b4900ff6b2d179de0904684fd9aaf1cdc21674bfe4 +size 13306483 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5f28dfd7ca34a9066a9d624eebabc72759024239 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4946bb8bbeaae607d2dd87f328f0596a443fc0e6e1929c97aace9042bcaca5e +size 18903504 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2f9d9d631194208cc1cf0c6099b0423bfe7dbcd4 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52630c6c61a65df5a9dce85580243e224dc59ee516851c89a1592c70e106cd7e +size 24322671 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0bd13a081bb563163a39443e1b6f9c9df1eea520 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:394ab9dffe66303f6d0beddc5308586e139c895dada3fa96ca6c1dbf89b7a897 +size 29467378 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ab3f0f9a51467097ac8dc3dfce24ea5a424a18bf --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c15a5ef459e948f7bfbd6d68227e1762b2ce7637fc2f7175aa9a5e6991b10b2 +size 34797915 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..334086af207f729517b21cf0016fcce9660012a2 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7f58720413cce4837889658f028c48ca407f972c07046ae5fb226055bb7e6f4 +size 4616393 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..755db4971ad5f705d65a86f6fa0753bf0faf3a2d --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b65c8b56a12703bcf7b31b38716b860975edfe6050ba949d98a54d6eab283bd3 +size 5024615 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f3162c7fe596344f1bc3ae95d2875bb2e92a89f3 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c299919474ce86ff8f670e5f40e4e54524d6772c983f6b49165fc988d5cc8cb6 +size 6111028 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5719be9c013f34b694c8f6bbd4cfd69141719ebe --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:425fb1923ba3668a1ca862c2df2f30f1912cfca5e79966ea362410ecf5ed6f96 +size 7193818 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..48b2e072ab7e78170940849b988f2294169caa1c --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9af39f456f44d976744a15136777bbd27723d2068a7faffaf93850ca44f0b38 +size 8272155 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bb6eab40f216d9d979a231423ff4d85ed8cc2839 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c0f3949ed1535cf13a0fbcbdd899dbe80f5656afdef653fecd64272cec6657 +size 9362106 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_0.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5ccf88079b9ab3c7e17836f8257f268ff4561887 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ba4d80e0ad5953066899d7f12b3531414fed94a64628b213b7abdc853c1f959 +size 2786916 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_1.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9acc4253cfaf6cb00557c97ecc2d68fc9b9b26c6 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:501744cf72e59f0f9a5f2c71a866b31bb359e08c3ffce8748c27b8d96e7f4b40 +size 5102712 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_2.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..31f038e97f8a2df387f0a16ec89ec5dc73c3318e --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3235d0b964601c05aaf451b72ac19a7ce64bd3883fc67053155797ec5a05ebce +size 7377919 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_3.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4909e495ca24b4cd5aff8a778bd582b0f3d336c8 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07a898cace64631b796782ff169bf60ddb0a3298de532b2899ca334f25cc8e53 +size 9646871 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_4.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..23ed8e4216fedc676e225815b20d85bd24939092 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc7925d9594a2db252572ba4c43a213d60cd5c6238bc7541fa2b14e3c238715 +size 11671883 diff --git a/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_5.jsonl b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ee4e4600ddfce4f1161ad4eeac1ae73143064f95 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/examples.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b14b1bd74fe0b2008040e2c4461db3caebadbc1d84ba947436fd9c7015996db +size 13897542 diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4794045fc500c1b42ea1b3552ef35481ef039443 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.33698931558059864, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03520091082802491 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06832528700117271, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002020031616020774 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.24924535874354928, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004710667742123965 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09682464818590401, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0021746201526808115 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.031623603705718525, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010704082391642267 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.12321043440007193, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0031299036359367484 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04638572157936821, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013302529021085698 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06503251084712686, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0018228814683563853 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.242120358957363, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0045711852361007615 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09281887400756049, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001998996594014213 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06504280718043812, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018744892527656203 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.23925679819243256, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004467359403537819 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09242326380243195, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002033441173958409 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ed273cb1c01511e4cab1bbaafeaa617fc30b29f7 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.50071840910503, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04570119173979742 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07262405538535584, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015025709069587576 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3545200580306086, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005274328693296472 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11243638843069366, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020002359883771006 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03411790558117329, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009146851141661013 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1735824312348198, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036281888114770787 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.052828679189574415, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012458061281784743 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06858742604428675, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013499175148544084 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.33533941614782714, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00489862350776037 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10640900334612001, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018168238044968257 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06889204707695668, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014115064627086959 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3353795561043291, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0048767168213307635 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10662100746126313, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018761173400960428 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..0e22177cfa253b7fb4a6a7245f896abe42b05720 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5940498197237445, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.045360168270571564 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07459577331672164, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001595194413101619 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38907556546905864, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0054304691316662745 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11593737527731507, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001949513588062909 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.035114673270987544, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010081353981524028 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19584375989737013, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004008082321996039 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05449451670049787, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012399615319130626 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06931044734650851, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001428917200995628 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35996374778547313, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0049025475018146785 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10783733998051759, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017619447024028836 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07079493663216743, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0015053431740885688 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3670729702378272, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00501564179221856 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10992722332009006, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018365522736996146 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1f18c981ed8b61057c6fb344f67e065ac76f2544 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6360838559544998, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03653875799485711 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07236011578940099, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013910988503604417 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3928435128894812, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005384069245593369 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11355856417583833, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017735693070030508 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.033363396708401855, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000803140401456714 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19915667523109754, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004011860806625624 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05302505138393545, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011266752102525668 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06687767191203486, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012600410796976124 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3592559338816392, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0047582409926964905 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1048768596135265, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016046493945327915 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0682810245315365, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013111163093307867 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3687377662903542, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004960565943300161 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10707993411906895, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016657550135363104 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..fc442dd262af81543c76d4459ed73f1ae93ba156 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7027350329668681, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0419156836814436 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07411348564826069, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012900003957059321 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40994918124441987, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005364326251363318 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11781335466174786, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017761239549537581 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03434960773754005, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007831150259881873 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20756196914680475, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004035186327369416 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05494234282461018, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001125668640595295 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06799320620725614, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011446709666944061 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37268673451611783, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0047156874564148465 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10796130107897399, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015796761570714324 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07001046072193005, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012147694362971294 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.38481667508014805, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0049365819422690195 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11115469880289687, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001670218626963014 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..706120be68f3fb58817ffb976aac1742410fe5a8 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7868609033139111, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.040304136105284674 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07559215659324663, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013368561782119886 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4322159752184723, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005507418892615091 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12053057909919479, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017893350216202717 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03531136059294999, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008350132401271129 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.22153138326278524, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004197864843142094 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05660554273746949, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011398496071974332 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0683868166969706, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011383097189411916 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.387608398091316, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004759866077492818 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1089770281372542, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015496587154532736 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07105854805056085, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012600458442573047 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.40338460571037565, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005019831598860692 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11313127630281221, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016759508017601735 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..779482f5fd1632d9db44875d6d7a9173c24451d0 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14983850803367624, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018751672389164477 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2550580803178272, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027794243641439476 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1749169386171503, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018652551820908833 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.030382874922609843, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007519667664767079 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.054505775605249815, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014473521383030284 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.035914103574269995, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008571739488027627 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11682287834978397, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013372228496992414 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.20560214095840312, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022848479838345685 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13780562967661653, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001358236237017717 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13742857779903467, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017113854895127892 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23501911131597872, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025756220873118974 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16059954854119637, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017011067980149748 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5100556841549206, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.056240452574111845 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6a74c6be7fadab522689a67ed9419c0c074545ef --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1965390881322699, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0022899400776314653 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.3206094100455321, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002849589854137116 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22285165404429813, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019735517320632746 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05045558070635316, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011660432710824278 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08246262292072058, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017565984624132588 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.056001917384198796, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010665112573503633 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13895822267839106, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016253397048819503 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23337530287957864, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022628070507281664 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15830852566063647, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013457659853471373 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18479852886338183, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0021643241999535143 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.3019972782519105, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002703215847122071 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.20945729941888908, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018462891651681006 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.965142818939576, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06637064806778528 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9bc2c220e497313748d6a1489c1661ee5e76fc95 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.20155746658889173, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0023374350511286197 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.3173353129081016, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002820895911494938 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.2236964233973595, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019023763735918212 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05269972304999503, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001197033866295586 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08395356718136517, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017436680982696616 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05753113933914173, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010826117471515486 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.14470120145484863, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017283958163244364 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.233378725309496, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0023004114225280213 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.16108340919074526, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001357852843091288 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.19006446021144513, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002218603404878938 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.30023601631924435, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002704859202966948 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.21101035224845988, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001793590665001926 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.092360521821163, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08937218000390199 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5fdbf381d6bf29383df905118e454ea9ba829901 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.17379375635824176, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0026246110896642268 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2638936090552038, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003388128200410466 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1865213351213735, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022753171506905965 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04282623790563042, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011568698796170502 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06755023246625483, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016980876475847096 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04592788875910395, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010286025903021396 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12470876767206059, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00198989611192214 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1925552246827813, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0026451539087018585 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13306544091830314, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015985646389652382 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1641047927743934, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0024936634430607935 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24985286020591305, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0032309944265283695 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1760787377574676, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021410940507585008 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.9732444729240193, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09147492615114675 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f941f26dc052e747ed52a5e4f9cba289bf44cb88 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.059448771232523664, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002218569421407597 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08822441141978317, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003020915797584135 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.0605919538076038, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020099409218817697 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.014949718004119315, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008976901887326936 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.02428038352612278, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001276025523659211 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.015593229425275027, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007474058630918573 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.0446701681314208, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017283868647508462 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06670046801956148, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002362351165144592 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04486687523926569, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014834001600610909 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.056074265222838884, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020960296913534976 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.08343237936875103, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00287322955407947 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.057104894137255724, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018950436973998253 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.6533679656816203, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04947451807737188 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..48ffa7010d488f828cc24c2621fc0cb84105be58 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.009348211882001287, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0009832878517389112 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.013688335464355616, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0013308943056046898 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.00929579656840014, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008648371348177522 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.002530983918335585, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00045036458463964445 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.00396277708838197, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0005637401793403029 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002384610836596322, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00028677749720556095 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.007189697647068899, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0008082293363466722 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010450449827034726, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0010632636910403864 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006964849797303445, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006505850643049141 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.008774341101660414, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0009302597680921362 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.012985553018433522, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.001276501870842985 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008747681514956059, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008159791184455816 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 4.1457161238536384e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 9.147191188223124e-07 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..7b0322c6f5cfa3af577dfd14618b029140e5eaef --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.37083773151234173, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.023770267793187624 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.06608746744853429, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0006810687592344808 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.14195087368704973, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0012610802186243078 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.08851879719705498, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0008401305153826185 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.0034258087224012515, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.00032514807417983457 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.00704033391818721, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0006361810577325418 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.0045379311452906496, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00042315898801261495 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.06585617168656571, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0006670941024074856 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.14144906524240433, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0012314615868737277 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.08820722536535333, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0008208954817151469 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.05497072058739539, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0005636175471074675 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.11929179350942047, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0010831868664373235 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.07382731521584816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0006992840645883968 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..edd38948f3cf893271610b3227969e415a702f11 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.210308239038657, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.13532926187041483 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5337134369290545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0033441618301280323 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4186112103011673, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.003029511762554002 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.44364097425563637, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0024213391823928623 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2503358019053269, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025907821242386786 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19267261882751974, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002098816040806122 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.20464247864479315, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019524189816088483 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3856908650245338, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002931334041050201 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2989387799212162, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024147108908862333 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3179154131738048, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002060565311895604 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4329536166939937, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031784168539919287 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.33757778280843753, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027140890148101187 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35856203407161186, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023230420120309756 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..fe558a8ee60e962dc19cbe7b66d3bfe5689488e4 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.855010359789356, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1433052434909132 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5659453062773773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003270807439335411 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4426574876800998, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002892096018797496 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4715984211104789, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002279297442582234 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.27838189797515667, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002671533749085893 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21363966698505715, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021189348260758872 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22811726769856144, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019828962661021204 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4103597152277875, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002911142472749296 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.319223478072641, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023906932022469385 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3403464767676166, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020236690372816674 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.461695670382684, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031155745746790013 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.36069384550050293, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002666755684059944 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38431431509550784, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022508604583330134 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ed98a9d361827a80bcb8d6308d515338630c5834 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.64156249802983, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15061545188803951 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5750153314520224, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031859723554921284 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4510440289695527, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028677830005739494 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.48080915530796386, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002234979483832272 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.28884561820039295, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002639498857757876 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22357397871649595, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022043371695741783 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23831207673207944, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002020312344935205 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4195446580367559, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029133142431469273 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3276080175727646, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024527144670301914 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3492803919842545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020660644514658923 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4727009044140323, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031160796738222674 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.37055635583114344, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027125904536736854 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39480073772752605, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022686218848066435 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0d48b3ce199cae7cc3987dfc6cf995eb6b1962a0 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.48978762764689, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.18010374224713105 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5783755973364397, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003188421667895018 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4521748484155905, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028320142916950963 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.48299936414020656, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021956091228780565 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2905353846413916, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026426279354766213 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22353380032103162, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021373490578138086 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23895749463268698, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00196124259284921 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4173159956369907, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029141064950507158 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3255911950461323, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024733626405686934 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.347484945544206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002079636990372097 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4733193294500394, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003118544106260605 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3704278657572045, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027237053634839347 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3952584823764592, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00227735538013133 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..536f65aba1b0208b39ee2dabe7c52501edb19bfa --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.585319575612113, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15871453640685637 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5799683476103964, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031994912520596636 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.45706214916858773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002844413918683844 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.48786585090169554, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00223672743807504 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.29236226184175695, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026385490403355457 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22695605327657692, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021727413185400174 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.24237216469601944, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019981286651549568 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4148253441054077, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.00283534958682861 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32700945528721864, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002473535129442898 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34850083462923376, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002084486638424466 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4734672508470655, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030825263814209243 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.37359433682039755, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027168498928153875 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39837100157486816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002290117281740733 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..019c8e07e7e27041ffcf6253b9adbb0dcdb12f30 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.16876091355105496, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002428477465457079 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3341076035740682, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0046048681292224745 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2136631527247442, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026638229066998256 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03747194366522528, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0014955773574022288 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07911851428210626, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002822698047160193 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04856213249829562, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0017561436649774235 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1271557431168007, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0019539789800342004 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25284226031166046, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0036682449427253147 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1610160340198798, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0021142466349326873 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.13217520866885155, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002071100870900028 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26428103009111936, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004079358230845003 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16787123550272315, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0023335572634387495 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.1113783413326344, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11912014552832849 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d33dee309dca2a061e8c50eecb9d8a4d075daa13 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12927526554265445, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018265553859337874 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3185510498370038, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004229864775990553 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.18170879656881125, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.00245218614539981 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02602935902165096, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001023224048321341 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06652536681300213, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002722006503197127 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03694944789541673, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001451072652969939 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09989029850197624, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013879057374961837 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2479107129331233, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003381030448367971 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14062720750461896, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018793551451232017 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10341765201003357, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015149831274551388 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2571991639086138, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003711770412976227 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14570314466301257, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002064223760081791 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4807516008262442, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10561063787286398 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..3388458ea02eefbba3b91a24b17afa27fbd578b5 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13145946154632493, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018544974879548131 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.32387324210035007, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004267761663343424 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1847484789507431, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024906095591687542 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02808308652134632, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010347320981807847 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07187873077263424, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027472238907884166 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03989446165864525, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001470552354617615 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1019161886732123, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001391499897049356 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2535896765342832, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034183375598958493 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14356843077788037, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018927425748884437 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10460558980438973, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015202856124887812 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2605683575765448, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037100189499078345 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14741895358409335, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020743741796644924 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.6562203262313626, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07982304015370187 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c3a89751f4fb266d81855a53413298f3a2b5a0b9 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13318228571463592, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0020455353549147103 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.317018855215892, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004518876538639268 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.18390048441125048, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026657496989706104 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.028785220783836416, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010625475528616283 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07136621731857556, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026618058930387434 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.040350616115479146, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014683337326124046 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10172139078346341, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0015298521300718705 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2445625759480037, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003569632794081247 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14086692618233734, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020271972409091304 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10639989816115737, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016639989017194455 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.255751047100679, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0038734069167402317 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14729860857759783, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002200650446133668 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.7657291524477807, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11405030461208435 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..2e16a352db13eefca56246030b84e279a1c88c9b --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0415260420063545, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0026056508945012298 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07757055211542944, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004506312599731837 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04858562888319941, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0027184130065024178 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0074966026006513965, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006746135809758764 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0173613412544955, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0015976731193386722 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.009949994948206649, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0008716091074829112 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03194572657523972, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.002158988118941094 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.05898387332591097, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003484814745152857 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.036593331243362004, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020450096289478343 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.033578484743865225, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002237487835101602 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.06211470890687305, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036822940469355132 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0385888024512549, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002163672046764109 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7368905267923197, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10568292014256596 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0a2990e494ea10ceb5a678d31e4313a6a4bfe37a --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/generation/slim.4b284b84bc4v2seed3_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0029927391798704375, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0008124604444580753 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.002590023053043221, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0006974154226908588 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0027194147089883844, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0007296230437372524 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.000247284899936924, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00011058519545078262 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00019440465195182176, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 8.882271405728297e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00021508550838189274, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 9.668205684028845e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.002007763097414947, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0005311869704827251 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0017507054146174415, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0004724443085314579 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0018356640850194482, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0004879741431962152 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0022522452753482606, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0006086895267107963 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0020127265562168294, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0005598466140344547 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0020761523840976182, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0005629570167031783 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4041260567643717e-38, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.3322404897773207e-33 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_0.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_0.json new file mode 100644 index 0000000000000000000000000000000000000000..cc43c07c112a8ca7433f2a5f4da0e4ed468fe6c9 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928364 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.01483050720454104 + }, + "anli_r3": { + "acc": 0.3433333333333333, + "acc_stderr": 0.01371263383046586 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.2127316680096696 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.47400916152160927, + "acc_stderr": 0.00498303542023572, + "acc_norm": 0.6269667396932882, + "acc_norm_stderr": 0.004826224784850451 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.02988212336311872 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.013840971763195304 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.5825688073394495, + "acc_stderr": 0.00862499005021668 + }, + "arc_easy": { + "acc": 0.6014309764309764, + "acc_stderr": 0.010046455400477937, + "acc_norm": 0.531986531986532, + "acc_norm_stderr": 0.010238767643185714 + }, + "arc_challenge": { + "acc": 0.26706484641638223, + "acc_stderr": 0.012928933196496354, + "acc_norm": 0.28924914675767915, + "acc_norm_stderr": 0.013250012579393443 + }, + "sciq": { + "acc": 0.85, + "acc_stderr": 0.011297239823409314, + "acc_norm": 0.752, + "acc_norm_stderr": 0.013663187134877637 + }, + "piqa": { + "acc": 0.7551686615886833, + "acc_stderr": 0.010032309105568795, + "acc_norm": 0.763873775843308, + "acc_norm_stderr": 0.009908965890558218 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_0_lm-eval_global_step80108_2023-02-22-18-53-17_0shots_backup.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_0_lm-eval_global_step80108_2023-02-22-18-53-17_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..cc43c07c112a8ca7433f2a5f4da0e4ed468fe6c9 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_0_lm-eval_global_step80108_2023-02-22-18-53-17_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928364 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.01483050720454104 + }, + "anli_r3": { + "acc": 0.3433333333333333, + "acc_stderr": 0.01371263383046586 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.2127316680096696 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.47400916152160927, + "acc_stderr": 0.00498303542023572, + "acc_norm": 0.6269667396932882, + "acc_norm_stderr": 0.004826224784850451 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.02988212336311872 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.013840971763195304 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.5825688073394495, + "acc_stderr": 0.00862499005021668 + }, + "arc_easy": { + "acc": 0.6014309764309764, + "acc_stderr": 0.010046455400477937, + "acc_norm": 0.531986531986532, + "acc_norm_stderr": 0.010238767643185714 + }, + "arc_challenge": { + "acc": 0.26706484641638223, + "acc_stderr": 0.012928933196496354, + "acc_norm": 0.28924914675767915, + "acc_norm_stderr": 0.013250012579393443 + }, + "sciq": { + "acc": 0.85, + "acc_stderr": 0.011297239823409314, + "acc_norm": 0.752, + "acc_norm_stderr": 0.013663187134877637 + }, + "piqa": { + "acc": 0.7551686615886833, + "acc_stderr": 0.010032309105568795, + "acc_norm": 0.763873775843308, + "acc_norm_stderr": 0.009908965890558218 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_1.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_1.json new file mode 100644 index 0000000000000000000000000000000000000000..0177e9b075d745bdb2f14fe8385744b2e4ab086c --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.327, + "acc_stderr": 0.01484221315341124 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.014899597242811492 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.01368049572576779 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.35057471264367807 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.040201512610368445 + }, + "hellaswag": { + "acc": 0.4731129257120096, + "acc_stderr": 0.0049825618152141244, + "acc_norm": 0.6270663214499104, + "acc_norm_stderr": 0.004825963768772216 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.574585635359116, + "acc_stderr": 0.013895257666646378 + }, + "storycloze_2016": { + "acc": 0.7140566541956174, + "acc_stderr": 0.010449259851345842 + }, + "boolq": { + "acc": 0.5788990825688073, + "acc_stderr": 0.008635491562221344 + }, + "arc_easy": { + "acc": 0.6031144781144782, + "acc_stderr": 0.010039236800583209, + "acc_norm": 0.5723905723905723, + "acc_norm_stderr": 0.010151683397430673 + }, + "arc_challenge": { + "acc": 0.28071672354948807, + "acc_stderr": 0.013131238126975586, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623504 + }, + "sciq": { + "acc": 0.892, + "acc_stderr": 0.009820001651345696, + "acc_norm": 0.89, + "acc_norm_stderr": 0.009899393819724446 + }, + "piqa": { + "acc": 0.7589771490750816, + "acc_stderr": 0.009979042717267314, + "acc_norm": 0.7616974972796517, + "acc_norm_stderr": 0.009940334245876219 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_1_lm-eval_global_step80108_2023-02-22-18-53-17_1shots_backup.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_1_lm-eval_global_step80108_2023-02-22-18-53-17_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..0177e9b075d745bdb2f14fe8385744b2e4ab086c --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_1_lm-eval_global_step80108_2023-02-22-18-53-17_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.327, + "acc_stderr": 0.01484221315341124 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.014899597242811492 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.01368049572576779 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.35057471264367807 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.040201512610368445 + }, + "hellaswag": { + "acc": 0.4731129257120096, + "acc_stderr": 0.0049825618152141244, + "acc_norm": 0.6270663214499104, + "acc_norm_stderr": 0.004825963768772216 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.574585635359116, + "acc_stderr": 0.013895257666646378 + }, + "storycloze_2016": { + "acc": 0.7140566541956174, + "acc_stderr": 0.010449259851345842 + }, + "boolq": { + "acc": 0.5788990825688073, + "acc_stderr": 0.008635491562221344 + }, + "arc_easy": { + "acc": 0.6031144781144782, + "acc_stderr": 0.010039236800583209, + "acc_norm": 0.5723905723905723, + "acc_norm_stderr": 0.010151683397430673 + }, + "arc_challenge": { + "acc": 0.28071672354948807, + "acc_stderr": 0.013131238126975586, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623504 + }, + "sciq": { + "acc": 0.892, + "acc_stderr": 0.009820001651345696, + "acc_norm": 0.89, + "acc_norm_stderr": 0.009899393819724446 + }, + "piqa": { + "acc": 0.7589771490750816, + "acc_stderr": 0.009979042717267314, + "acc_norm": 0.7616974972796517, + "acc_norm_stderr": 0.009940334245876219 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_2.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_2.json new file mode 100644 index 0000000000000000000000000000000000000000..1dfd092b583e9761502d727edc5d9b55afa07bf0 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.308, + "acc_stderr": 0.014606483127342761 + }, + "anli_r2": { + "acc": 0.334, + "acc_stderr": 0.014922019523732965 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.013490095282989521 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.24493628437290407 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.47122087233618803, + "acc_stderr": 0.0049815090992763504, + "acc_norm": 0.6280621390161323, + "acc_norm_stderr": 0.004823341569605425 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.590370955011839, + "acc_stderr": 0.013821049109655478 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.6039755351681957, + "acc_stderr": 0.008553881336813415 + }, + "arc_easy": { + "acc": 0.6212121212121212, + "acc_stderr": 0.009953737656542037, + "acc_norm": 0.5963804713804713, + "acc_norm_stderr": 0.010067368960348216 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.013214986329274774, + "acc_norm": 0.310580204778157, + "acc_norm_stderr": 0.01352229209805305 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.009363689373248102, + "acc_norm": 0.893, + "acc_norm_stderr": 0.009779910359847167 + }, + "piqa": { + "acc": 0.7540805223068553, + "acc_stderr": 0.01004733186562519, + "acc_norm": 0.764961915125136, + "acc_norm_stderr": 0.009893146688805315 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_2_lm-eval_global_step80108_2023-02-22-18-53-17_2shots_backup.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_2_lm-eval_global_step80108_2023-02-22-18-53-17_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..1dfd092b583e9761502d727edc5d9b55afa07bf0 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_2_lm-eval_global_step80108_2023-02-22-18-53-17_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.308, + "acc_stderr": 0.014606483127342761 + }, + "anli_r2": { + "acc": 0.334, + "acc_stderr": 0.014922019523732965 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.013490095282989521 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.24493628437290407 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.47122087233618803, + "acc_stderr": 0.0049815090992763504, + "acc_norm": 0.6280621390161323, + "acc_norm_stderr": 0.004823341569605425 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.590370955011839, + "acc_stderr": 0.013821049109655478 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.6039755351681957, + "acc_stderr": 0.008553881336813415 + }, + "arc_easy": { + "acc": 0.6212121212121212, + "acc_stderr": 0.009953737656542037, + "acc_norm": 0.5963804713804713, + "acc_norm_stderr": 0.010067368960348216 + }, + "arc_challenge": { + "acc": 0.28668941979522183, + "acc_stderr": 0.013214986329274774, + "acc_norm": 0.310580204778157, + "acc_norm_stderr": 0.01352229209805305 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.009363689373248102, + "acc_norm": 0.893, + "acc_norm_stderr": 0.009779910359847167 + }, + "piqa": { + "acc": 0.7540805223068553, + "acc_stderr": 0.01004733186562519, + "acc_norm": 0.764961915125136, + "acc_norm_stderr": 0.009893146688805315 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_3.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ce5018faeab2ab62373880a3bcd2c7c134ed6af9 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.316, + "acc_stderr": 0.014709193056057121 + }, + "anli_r2": { + "acc": 0.347, + "acc_stderr": 0.015060472031706622 + }, + "anli_r3": { + "acc": 0.3308333333333333, + "acc_stderr": 0.013588208070709007 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.39707602339181286 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.47211710814578767, + "acc_stderr": 0.004982016702445961, + "acc_norm": 0.6292571200955985, + "acc_norm_stderr": 0.004820166002253063 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5943172849250198, + "acc_stderr": 0.013800206336014208 + }, + "storycloze_2016": { + "acc": 0.7258150721539284, + "acc_stderr": 0.010316062787590011 + }, + "boolq": { + "acc": 0.6030581039755352, + "acc_stderr": 0.008557276964675146 + }, + "arc_easy": { + "acc": 0.6321548821548821, + "acc_stderr": 0.00989492346445519, + "acc_norm": 0.6123737373737373, + "acc_norm_stderr": 0.009997307914447612 + }, + "arc_challenge": { + "acc": 0.29948805460750855, + "acc_stderr": 0.013385021637313562, + "acc_norm": 0.31569965870307165, + "acc_norm_stderr": 0.013582571095815291 + }, + "sciq": { + "acc": 0.915, + "acc_stderr": 0.008823426366942314, + "acc_norm": 0.909, + "acc_norm_stderr": 0.009099549538400241 + }, + "piqa": { + "acc": 0.7611534276387377, + "acc_stderr": 0.0099481203853375, + "acc_norm": 0.7611534276387377, + "acc_norm_stderr": 0.009948120385337484 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_3_lm-eval_global_step80108_2023-02-22-18-53-17_3shots_backup.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_3_lm-eval_global_step80108_2023-02-22-18-53-17_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..ce5018faeab2ab62373880a3bcd2c7c134ed6af9 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_3_lm-eval_global_step80108_2023-02-22-18-53-17_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.316, + "acc_stderr": 0.014709193056057121 + }, + "anli_r2": { + "acc": 0.347, + "acc_stderr": 0.015060472031706622 + }, + "anli_r3": { + "acc": 0.3308333333333333, + "acc_stderr": 0.013588208070709007 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.39707602339181286 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.47211710814578767, + "acc_stderr": 0.004982016702445961, + "acc_norm": 0.6292571200955985, + "acc_norm_stderr": 0.004820166002253063 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5943172849250198, + "acc_stderr": 0.013800206336014208 + }, + "storycloze_2016": { + "acc": 0.7258150721539284, + "acc_stderr": 0.010316062787590011 + }, + "boolq": { + "acc": 0.6030581039755352, + "acc_stderr": 0.008557276964675146 + }, + "arc_easy": { + "acc": 0.6321548821548821, + "acc_stderr": 0.00989492346445519, + "acc_norm": 0.6123737373737373, + "acc_norm_stderr": 0.009997307914447612 + }, + "arc_challenge": { + "acc": 0.29948805460750855, + "acc_stderr": 0.013385021637313562, + "acc_norm": 0.31569965870307165, + "acc_norm_stderr": 0.013582571095815291 + }, + "sciq": { + "acc": 0.915, + "acc_stderr": 0.008823426366942314, + "acc_norm": 0.909, + "acc_norm_stderr": 0.009099549538400241 + }, + "piqa": { + "acc": 0.7611534276387377, + "acc_stderr": 0.0099481203853375, + "acc_norm": 0.7611534276387377, + "acc_norm_stderr": 0.009948120385337484 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_4.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_4.json new file mode 100644 index 0000000000000000000000000000000000000000..85e7ed8057e91a489479bda37b70a8bba463b6c6 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270334 + }, + "anli_r2": { + "acc": 0.355, + "acc_stderr": 0.015139491543780536 + }, + "anli_r3": { + "acc": 0.35083333333333333, + "acc_stderr": 0.013782212417178199 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.26794871794871794 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.037752516806863715 + }, + "hellaswag": { + "acc": 0.4726150169288986, + "acc_stderr": 0.004982291744069915, + "acc_norm": 0.633240390360486, + "acc_norm_stderr": 0.004809352075008949 + }, + "rte": { + "acc": 0.4729241877256318, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5911602209944752, + "acc_stderr": 0.013816954295135696 + }, + "storycloze_2016": { + "acc": 0.7279529663281668, + "acc_stderr": 0.010290888060871242 + }, + "boolq": { + "acc": 0.6159021406727829, + "acc_stderr": 0.008506861063860244 + }, + "arc_easy": { + "acc": 0.6355218855218855, + "acc_stderr": 0.00987572928248244, + "acc_norm": 0.6111111111111112, + "acc_norm_stderr": 0.01000324833531377 + }, + "arc_challenge": { + "acc": 0.2977815699658703, + "acc_stderr": 0.013363080107244489, + "acc_norm": 0.3046075085324232, + "acc_norm_stderr": 0.013449522109932487 + }, + "sciq": { + "acc": 0.915, + "acc_stderr": 0.008823426366942324, + "acc_norm": 0.917, + "acc_norm_stderr": 0.008728527206074787 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867486, + "acc_norm": 0.7671381936887922, + "acc_norm_stderr": 0.009861236071080751 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_4_lm-eval_global_step80108_2023-02-22-18-53-17_4shots_backup.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_4_lm-eval_global_step80108_2023-02-22-18-53-17_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..85e7ed8057e91a489479bda37b70a8bba463b6c6 --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_4_lm-eval_global_step80108_2023-02-22-18-53-17_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270334 + }, + "anli_r2": { + "acc": 0.355, + "acc_stderr": 0.015139491543780536 + }, + "anli_r3": { + "acc": 0.35083333333333333, + "acc_stderr": 0.013782212417178199 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.26794871794871794 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.037752516806863715 + }, + "hellaswag": { + "acc": 0.4726150169288986, + "acc_stderr": 0.004982291744069915, + "acc_norm": 0.633240390360486, + "acc_norm_stderr": 0.004809352075008949 + }, + "rte": { + "acc": 0.4729241877256318, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5911602209944752, + "acc_stderr": 0.013816954295135696 + }, + "storycloze_2016": { + "acc": 0.7279529663281668, + "acc_stderr": 0.010290888060871242 + }, + "boolq": { + "acc": 0.6159021406727829, + "acc_stderr": 0.008506861063860244 + }, + "arc_easy": { + "acc": 0.6355218855218855, + "acc_stderr": 0.00987572928248244, + "acc_norm": 0.6111111111111112, + "acc_norm_stderr": 0.01000324833531377 + }, + "arc_challenge": { + "acc": 0.2977815699658703, + "acc_stderr": 0.013363080107244489, + "acc_norm": 0.3046075085324232, + "acc_norm_stderr": 0.013449522109932487 + }, + "sciq": { + "acc": 0.915, + "acc_stderr": 0.008823426366942324, + "acc_norm": 0.917, + "acc_norm_stderr": 0.008728527206074787 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867486, + "acc_norm": 0.7671381936887922, + "acc_norm_stderr": 0.009861236071080751 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_5.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e80643c497e39ed0e9882780d370b285d82b3e1d --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.341, + "acc_stderr": 0.014998131348402695 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.015070604603768408 + }, + "anli_r3": { + "acc": 0.3408333333333333, + "acc_stderr": 0.01368860079329693 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.2506410256410256 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.4731129257120096, + "acc_stderr": 0.004982561815214125, + "acc_norm": 0.6352320254929297, + "acc_norm_stderr": 0.004803812631994968 + }, + "rte": { + "acc": 0.49458483754512633, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.595895816890292, + "acc_stderr": 0.01379161066467086 + }, + "storycloze_2016": { + "acc": 0.729021913415286, + "acc_stderr": 0.010278188399635048 + }, + "boolq": { + "acc": 0.6116207951070336, + "acc_stderr": 0.008524357307908785 + }, + "arc_easy": { + "acc": 0.6397306397306397, + "acc_stderr": 0.009851002584732383, + "acc_norm": 0.6157407407407407, + "acc_norm_stderr": 0.009981120724601436 + }, + "arc_challenge": { + "acc": 0.3037542662116041, + "acc_stderr": 0.01343890918477875, + "acc_norm": 0.3191126279863481, + "acc_norm_stderr": 0.0136216961191733 + }, + "sciq": { + "acc": 0.921, + "acc_stderr": 0.008534156773333438, + "acc_norm": 0.916, + "acc_norm_stderr": 0.008776162089491132 + }, + "piqa": { + "acc": 0.749183895538629, + "acc_stderr": 0.010113869547069044, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_5_lm-eval_global_step80108_2023-02-22-18-53-17_5shots_backup.json b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_5_lm-eval_global_step80108_2023-02-22-18-53-17_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..e80643c497e39ed0e9882780d370b285d82b3e1d --- /dev/null +++ b/4b284b84bc4v2seed3/evaluation/rankeval/4b284b84bc4v2seed3_5_lm-eval_global_step80108_2023-02-22-18-53-17_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.341, + "acc_stderr": 0.014998131348402695 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.015070604603768408 + }, + "anli_r3": { + "acc": 0.3408333333333333, + "acc_stderr": 0.01368860079329693 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.2506410256410256 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.4731129257120096, + "acc_stderr": 0.004982561815214125, + "acc_norm": 0.6352320254929297, + "acc_norm_stderr": 0.004803812631994968 + }, + "rte": { + "acc": 0.49458483754512633, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.595895816890292, + "acc_stderr": 0.01379161066467086 + }, + "storycloze_2016": { + "acc": 0.729021913415286, + "acc_stderr": 0.010278188399635048 + }, + "boolq": { + "acc": 0.6116207951070336, + "acc_stderr": 0.008524357307908785 + }, + "arc_easy": { + "acc": 0.6397306397306397, + "acc_stderr": 0.009851002584732383, + "acc_norm": 0.6157407407407407, + "acc_norm_stderr": 0.009981120724601436 + }, + "arc_challenge": { + "acc": 0.3037542662116041, + "acc_stderr": 0.01343890918477875, + "acc_norm": 0.3191126279863481, + "acc_norm_stderr": 0.0136216961191733 + }, + "sciq": { + "acc": 0.921, + "acc_stderr": 0.008534156773333438, + "acc_norm": 0.916, + "acc_norm_stderr": 0.008776162089491132 + }, + "piqa": { + "acc": 0.749183895538629, + "acc_stderr": 0.010113869547069044, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1149bdb30d41c5d17d0f56d7638554b2e63a9d9d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1d15acecb6b2ba952364b4a85b6d9a011979778666e1d40fee765ece6bc8e3a +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d0d0d533b2f742a8940b725eb6cabd96ff015ed --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f48349c575021c3aa1dfcc1215c94e9c87bb1041d289975b7536b68bd25fd4 +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af44b2207ff2913aeea7d4a909ab78ad908f97fc --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b7fcbe60c7a63bcf3cd2d5ce1aeb4c83d4891cb1af27c32150b2517a6d6e2f3 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d4176f7b38121a676e107f4c95cb0daecc49af0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebcdb6becb77e79f1b987390fa71d8b0982e9a24fa8c305eaf0e009a79e9313a +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ca8bd1b6b6768ae5225522017f53b60d1edd89b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4139426533b7eb24f7353954cbd6047fb2c74bbb21c45cd212d2cd39aa6c21a8 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dd4901576aa6855ef5c0b19d72617c55111b2df --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3bd24e6f3fee19677ea85716310ddfdf42b4ba2cfeca5dd14730aece73fe503 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b10d55d87a54e9ec7dcab54809da46fd203c10e8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9789d8e93056036950c7d0d61715dd6616027db87ad6002c6fe5a5bc366e625f +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3a60321b044b9151010a85df7d3a1c24df73265 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd0e4596c27a9bc92f54e5db3d7bdd206fcb3c6ef11e04ad93b8a0f6fffad6b8 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47a85d5c0609ddc4a6415bc7b61263ca503b5ff1 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:013fbc0f630f00945ddd421fdf32f49ca256c226da089f9b67a9905e7f8b4d3c +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37f65661cdd6436769062c690569a052b03e53f7 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15dfee3de991abd3e35ae975be5b44551d815492ba485662bb4d445580a00ad7 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72ef47e0ef85db851fa6d1b790af3b13591c6645 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87bf13487d850d85fc9d647b1827d94e0441aaa6796441685f86ae69ac79f314 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc058942db95acb9841dac0bbccaf03d370869ab --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc429917674df2332ac470868f4f008846894d3440ed66dc5593127500e5cdf +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82c761b8cda1f2a8d295628ab5c06ea2e5e557a8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8893b1f1234da7806b71618eb345839a3480e59347fe96ad5519b44c22a805c +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df7e1a5fc01790f55a46e858797a9a75f8ade809 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9843f2f48d2c67801ccba772da3356cd8d44ccd8279a62864786bde6351438ae +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c839849616ff08c9f35f2238b617d955ebee197 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c8ddb569599b93f07042462fe60a6bd482e97e2012f2715037f7317ade17ab +size 199058669 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c35ba6e8aec012e3602f72aa0d459c6e1af6ff27 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82e2b4a233089c9ec6ad5335cd0b3241006d113eee748b1136b56f0141485228 +size 199058669 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa16f71d786d07eab4b563ab301aaeb73b3623da --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b99e027f5533d6d1b45ac0aa61e9e0b8ecdf0a79b2a9ee11cd26ba973bc7d4a +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dd9db02b34b5f9a8d6d01ec48d336b3dfccda8a --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4902809abcc1fcaf216e0fc9ccc2e474c5e7a305609d1dedc9eca225148045 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e0aa6c0dfa1c86ce79127232dda4fe74fda04fd --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7258b4f96f94858ed4f10220d25662627c1810cc1e478b3434fc90fa7c143c8 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04c9b65aea237e8c57f717e5ce867ef31da9efef --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c349d5692834f5f25411447c9e1d2cb1b06614551cc804ce44c65988d34c26b2 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97d0dd69aa023256a7de89f85ed5b737bfd6a217 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c4110c717e2c9675ac557bb4cd2615d0911612f87f6a3cde67efca488ab5562 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41195f36136e71399249adecd2399b286ed7fb6a --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f8e734459246d46d84c6b8626391129404bc4802f5d880b17a6de2c340e5eef +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4802544fccf4431c7f5a3fae79e13dcc529872cf --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a66fd0bfe37256cb8020fbfef7ce11f1e3535b7b880d0af28977fa8044904a60 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34e977934913c56444f1bd971dff547b9a381bd8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39c5fbc04ea353c99e12a4f1b186138158ffce4492f077dfb5e4341df89e0d6 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5508686c2b38bb484f1ad9778dcc62c4f8d95cc --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28c9c3124358acc84c259d721eba1cbeea2efba6d18040b350436494a468eeb8 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8996bef749d3736ae30b31c13bdd019ae479924 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d765a0b072c36928f6ae0722fd3de9580af88e4269770b82c4df17360a6e89d0 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9795bd5fa436e2891bdee031d8331a64d773a1a4 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cbafcc0044ebc1fbc80997156d1f117be768a4555d532173073a4c092935623 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d168dfba07f7b68e85b9e268369ebb1bf5f6d38 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54f0eb9118449ff3031664c71528ed4c91c683d280820f99410dda9094314be1 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b23fa470a6e10b36b23485d0c338e03dedcdcee --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0151162692987db3f9a76d72ff8a2cac7791f5754c252b6dc0e0b82cc71b7eb +size 199058605 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7993d7143d1bb05893309163baae8e469812e40 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e7248a4e360258bf9f06c92eb370596cbfb37ccff19fcb3c5612b649286f6f +size 199058605 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8531f8456252ec0197e46dc7f1a91463bac75a8f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb0102279005c169b2c8005a6da32bf421e0347276228d5e4c3ef2a574433545 +size 199058669 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cb00f79aa0d2eb129d955ac20eff3744cba123d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff866e09ab99ee57358d6338becd77d52be683325e1e24eaf3fe47030afda04a +size 199058669 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d9fe54099ebd288f03ce33598aad728dab7f3eb --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21cd3704acd7e80c038c115c2b883be8caf17f4245af50735892201c7e6f9cc5 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eb5d417285b3e98c27ba4c6699e4593fc04b272 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:272cc20277c042ae398a064caaa060614f07c43b3cf78affbda297851e573410 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3ef80fc0e74383b737c2f0a16a674190aad48a2 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:349b3c939348e3e7729d23803f05716771e2ee36b6c8299668978b075cc9c42f +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd70a5ced5e5d8ac81e12e2eec13adcfc0414483 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:984487a9d08d774ac97b3eabb3b092e05d7a730d526f94b2e572b2def054e452 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b0eb60ddf329bd40c54a807e8818100f6e92a32 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2a048b80e044c12956b3348cdef8eba08bee70ff4e3f6e7b17a3380d2c21abf +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22ee3033485d78a3675d24937fdc373672f46d46 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c961a0f538abc51cefaff26f61537953c126003f4d4c74c149587e5a4a1864a9 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88501768f5c13d7bd3a1692a52a81b8d23c4ad8a --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a30c120df03c40e8cb62a61529de990eda6fb80cd1554e9e1c529d546ecd806d +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d34a273e819ceb43ae644b1e880ad60c159b7ffa --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80059f7c57d71bb3be4b72a54581e7561ad3ee1fb2cce75c886071f920a642c +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1491b44370310eb98663baa09a16690134013d6a --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7c42c2090c3055fafaadd29dc8e687bea95165b3d7779fc14e01f1f95c360ea +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d48c93d2bf0dae9f4717e0fe1d586e2942f3c48 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4998cf3e3c3f88f0e5faba63c84d5a7631d2a4fc7562fb57eb358c9b2ff21602 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3fcbbd6d8a1cdc221fa427921c78f65011a3577 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbd3461607371137b7661e78d1cadb56e51e944b67952a90400cd4c6ad4231eb +size 199058669 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02d55002a4f13bf256c61f362404a9e2517ca940 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda7473567427112e5ca48aed79111798b1ccc51fdfda1c71ea2cebeff2c51f6 +size 199058669 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80f91227f4c7f57514b4129b79fa083e4a9d301c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba25dcd405cf271bd90af04521c14b898e341a43b12d1174844228e1605e47c5 +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc24ecf2fb4647dfb614ccd842b103f5019b8fae --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4a859aa254bfac8378bc652e8e3818eafc127e9b18b40d19e1d21a85c596320 +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bfcc32230bb2195f77d6c32805610eb68ef8dc0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8690eb4a14c4bf48f70eca3800caa977baddd28986064ceb936af49d0b5d2b34 +size 199058669 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4841e3e5c741a8e1d107affb8013120cd542c118 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f44eecb5fd2a741e4cf5e35d7630634da47fd16779e6971411f00e216892b1e5 +size 199058669 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d91bbd0a1857e75b1874c8718cb62f93b0d90525 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a21ffe9edb5269755ab24a193a793f88970fca004f66c476ed988ffd0eddfb4 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b36f71bc0928d1478c7c20d9fb39e82cc79024cc --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c97b92e440ecac6dd91a352e00c2582f73c29c969c3b20672f6cbf7c253d141 +size 199058797 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..489a2782a0f100cea4bfbfd070daaec8632dc902 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20387a7524451b53086b06d2bf648e6e650f03b303b401a06fc1dd445a70ef3d +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef93ca8e4fd147e4d71a56c5de980e727308ee11 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0259e1b4c7a3998c40311ff9e53f20feb9e706531ded39ab31dbfdd2a2f4d4a5 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d606b93e4990cb55905307d65b51615b8eb63895 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:672996b3cea111ec772fc8e0508650dda272a144257ecea1e1f0fd8ae6a44cd9 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe24cb98e6f6c91ad7f1ea86452cde7b3f74e55e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9b382cfe5645f22f6cf8069598a5920af4d1b55b0539f503a470f2f487bec88 +size 199058733 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7192f0ba274a837fb374ddb415007ba2f0ce3259 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a117a51ba9ab0183a109be1fff393c42090052d3f0e8ee83ecd406e55e8fe34 +size 199058669 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5a4a64be7844c8dd7761ebc7db688149a5d3dc7 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68ff43c0537a4170575bd0a81ead5cbb31f3c419a09bcad903f813feba707c3e +size 199058669 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba91d5236f4e2ba4716fc4b08c87395df6ab5931 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:307086deb9e1a9f2f926c7cca3be18b94aae4f91845532e391af3c69663657d1 +size 199058925 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0222d0a58a1634b54dbedb2a31d4f1b98b21fe98 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90085028efe9a76ddcb6294d0b7a3d9b1e1028536f5b5ee05ef519827fe7f831 +size 199058925 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..785b3c2d9168f20afdd8c7079da1a76c184f5c7b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d50f0f35b6f14a9ba9fa60d707473917d220b4dab8c88764f61366382129df4a +size 199058605 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ffb19373023bc7596d097d6781d70b6225accd5 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:233e81689708f37df52a2ab39856d8f4a4d9d35239b6a4790fdeb033a5d8f4b4 +size 199058605 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13cdddbff3bae72b0816ea66cf0abc33c933a071 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9335d3cd547b4681bccf9cfeec29dbe14d01ef22fa43ea6c0eeff25696d578c8 +size 199058605 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9222218d2914b1c7663a01489db9cd4595b1d405 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d270c6d96fc7ee72a85f6196c1205aa21e48ebf1f144fe7a0c070b369e06e374 +size 199058605 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da1085ccbec7e19be99fd7688d7fa4781bdf592 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aed7781a217f3ae40d78c9a703e088e84578be325e5d6a768536689ce3880a49 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..207320dd91114195507253c0202d83135ac5c27d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93cd02491f627caad10a892fe9f18ad980dada2e39cb6961183b56a6fbd10af7 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ff6b63379d2fc4a73630fcce8f51f17c623986c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12341cf6408d88b0e51fbf6014ee2fdfb590fbe6e38714a7ae85ecaa6e5cba5f +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75f2ade9aec1894ee1daca0d33d66464a7c2845c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33b6ab0ffa2f8fa04ff5aae50fa6ce465734e912ef9c42ae318070b21cf7d0f0 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..076a33e3efe2d9b8c418e793bd9a6dae1d65f5b0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7811ff9f3357f8a6b004cf7fc62f5c088c4a42ace678d78cb05cbaffbf64394 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e39a8b05789c4ceebdea2d629dfdcfe53e760ab --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12be0eaed52ffbb86be88369450b83ef06ee58387222ab266c75714773b53a74 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf1fde9795e2a6601b4f4aaf2c3e9f4d0bf603d0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b90ba1aedeedbf8f46d785c16f421f8d1c415fb7551222444473a68f4d4fa997 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..695de812ec503b26bdade0f2e7dfdce76f03449c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd285dd12e7c5b9e3c30bac101de9ee2bf017260f30d66c9e072f4c4f59f5bd +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e645a549186d5cfa50c6ca3087c55153e717a763 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973761aa531f51375e8517b2641c8dd947a0da4a969f2b1c6319634566fcd918 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d0daf2d96e2e5432d8f4931949115028fa036a5 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecc7fee3b65cd3e032999ca33607df8a622fac19558a3a298e9bd2c02a7e97a3 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..473880c28aa1eb349cd61ff7a1242ffaf2f39138 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d68bc2e5f2d1306fcf0485844429e5f80ecc9859485491a65a55410ffaba810b +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b20bcab6666f4cb23a02632e99823226137eb112 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a968630fcf0262cb95b0b63f8f9cac233e51087ff45bbb3ed46d17899ac60289 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd03f47c09d02ac8c8f3957aed54ebc67cbe8326 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85691c2c46b5fd1f2e0b8f676619b84edf27e0474a655503567f65ae1435ecc +size 199058978 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65d3107283df059201fe0c7081d4d9648952f059 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7909e75052f85948fba7d58788de87ad338a35d9f25834ea70223bc1306bb6 +size 199058978 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..479a6a8370e90fcd79854c233551caebb7318312 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3f6c60cd9f8075f22f13c133fe0af2f461228627e987dac7be2009e2c0d9218 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c31e4beccc012bb20d17fbb7769206918e91fe9 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d34781b557262d74d5b14cf1f9818887cf40f3b222f171c4cd1ef323c2a5e7 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2030b07e231fab3e11b9159be6e7a4886af6000 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57513b72750a0f5d8834fc78500053d1ace0036424786199978ba9a910313408 +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1816695b0d67efe0ff7891b21d4b1ca91b64d834 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17df33fb90ab6e95f73d471c5696d4dcce06123bcf709b9015a9a3e2275d5cfa +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..111b6df33a5398d28a0117c25e2b01c96e528b10 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2653a5256f30044feba2c2f3b1ed1c27cfa4bd49b4433843c00c367be786b0a8 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..442745d20fa62af59d440d00f86ca3c52156f636 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:611f2217ade9ca3bf787d9c7e19884b81aa728c6cb87982a39ec0eab6acd700b +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68e1c42f69c0b741143588138dadf9572b41e161 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:898f52c605cf523983f62655410be91e8452c828ddb1a4cfc927b101d790084c +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67a8ad98d2b95c25095a6cfa9b24664855763dca --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53422055d38ec398921a3ec433969336e26498f23289809bc6a4101c2b5c0890 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..289737bd3c56f15a0fe81fa4c52204d81cd87b19 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af192bb07d3baa518f99f81476eba7175e45867b3d53c0354d633438ae69033b +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfca4aed92c985bee41f6dfd7526997974590ea3 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffb9a8d1dcf96d04a24f6ad31d22b569747a0b2508fab4acb71e2e515916da53 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06d127514a7273a04c04cd1017fff1b3df6afc2e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58f3194a19cab2c50b76f389e4d4eda1a7ca973f6f5acdf9acd0546f091a2c62 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b9309eac64bb8671783f9ae6714aaa8af4b03a0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6cd910562c4330654c9ff8b921fe0967a312eb7c76390bb732412b13f5ff0ea +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34ac178dc1f9368f5ba9dd1a776669a2ef37b4fc --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66099d56f35cef8f386be76dde27d2af4603b586e2c6dec4ad32130854c46bcb +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..255ba1994b144021b979a7ea90270d900fa4c6d9 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78e926ba5d33610550460d07515b23779dfefac9a7ea743773f4630836ba67d2 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6a03f494691396a4f4818b800b6574b617070f4 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:306c8f6baeb13be7197f78bc8e592cba329a7fb15e6dfd80e8563b0f7572f960 +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a95ea9d3e7066141c06670ecb0b4e8fd80ae631 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f261ce2cd2e2de9087c39078bf95a5b5e52fdc8eee268a66c24490acf76de4f3 +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34ccfb45841d32b3e4e9e3374e2033e41529cfa1 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a13d8eaf4c6f0b1e74b44dd0e17ce57e4888f158c45fd4b1ed7815a126d5f84 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29b5e9f0ff7e55f2ce3f2453f48bdf3512dd8a20 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4fe04bd1720d4622bc59420b3fc15911877c3abea5ca5c8a78f4138040426cf +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff694b790be042f2cc327d5015927bf6b6f9bfd8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6605c1f65fdcd0a5740848c3f37bc9456fc7ec9dd332bec0ae45412a9bf948 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aef0c528bcb719b7d5c6513e32814fc91eea12ed --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cf399f962af996da8ece1257634fdee2b25f3492e258d2c339c031a9ea023c9 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7772b15af58a1488a4e7d267345887ef41e2d617 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7fab932d991bd1c2bddd78b7eba79699839b8b3dd5b7a563c187983339a17ba +size 199058594 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb3fa18d954f9366482859f67a1cfae4b5d8ede9 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06b11d52fb7c77f90caee6acd5fdacf7f4a5165249d6ed564e104c82f0e986c6 +size 199058594 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c7ccf39c459f811a77a552308674159555d06e8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6810ce8feef76a2f47e8b8afff70c2dece6843acf87a8ef037e07069894c1def +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..337d2a45e051953abcb426a8326abc4d932e16f2 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ad201bc7e7caa8b0aeecf5aa7958cd6adb4b68d8e24beefd84895c4174e38cb +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27e56159e35d49e08de53d5186866977152a3776 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15ba99e529fdc1da6ad380244548e8c447ca5f204263344414647cb2bc39345b +size 199058711 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdecd2b93735712d8ddd641117d32160746bdb55 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca186b1f6aef9119d5ab5c4e85bc358970e65295faab35c511206c90431a477a +size 199058711 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a526374951cdc9266080c178dc6815e490d7550 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45fc4b9505a06d34e286ac14bd53c16308e23deac4b4a5db3740ab812d0bb9d4 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e552204d822f0ee21a9df2e198d95f3a0ae1c67e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd34a3520d27d02725fc083bf71f4c754696871a54f07f6aacbbab192656a31 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a812ac687c1afa23bd5c868faa634f7185445537 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368c0aa2513b653c2850119895112ef8887401306d83b0470e3fb0bb06c1f2ae +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f49e9b2c5d7b6a26ec984ffa000a95381e4ae9b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72172cd6c6768198477d7873a4449a6a1bc57a32af674292fc84bdd9b64dd476 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edda9b0ba944f8ddf3ecd46a37b91ec58f7b02de --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9c51728d0955b42b36daa9cafbd560d8ce4ef86c406030f00733e04833e3e53 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2735365f8ac0cd48738fe2ded66b056a31b3fa42 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1df6f5b1e4c992508eb6dc793f4dbd25c57bbc759088376b002497b7515ab01 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71e3fb5528679b7e71f1a0f7b4a0449b5ed0db8f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eab5fcb549f700f6db3120d1b1f69eb5c6918ea8006e69e4257e1dfbe6e0f387 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5fa4f1e3453fddd26327ba03a8392e32f1ed0fb --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bddb283b96211f09e4be0b7a7bc41148a4a4e40eadf2b3b4305e8493e4899cad +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da13155283c0c7b4056b717ed19c1983018b02c4 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ead9b8a50bd22e651a885e4bca369af12cfe881de57d4ad69899fe8cf0f5e1a +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28de76aa477c06d34385c26d24df9b9573511603 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:529454abd4e31f52f9799b412a47b912e7188cda38bc8229c4d01b98a4885f11 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e24f327cfcad2eb58b20a1e8330c4ce9d14a8a91 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a20011b7026ab032c455d56f036285a232afeb11c4fc49b57c48dadf14bf723b +size 199058594 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e267958b5d17a54d0e2b4a8b1672dc0f115fe47e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b25860238dc31d8b698c6e0e5c445720dff5f0438b57fc68b162b3c8cf2ec61 +size 199058594 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c96d4b6c032a15d528a7771a70df43e19cad51b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffa208c1a5983470b5de496a046d16e89d9f8d7192b204af0418fbd208cab20a +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34a69cbbb99862630e37e6eb2aabc6d21c2a910c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1485a814d41df34cad2176989a6b8c58aef0550ad252991395928448ed9f30ca +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4766105ce3c67842c52dffa3d47c18801de45c17 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea62a3bb0c1d9fdb3f33146f9d7e10bfc29d1e51f053d75eef7d4e63ad66c9fd +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08626e34e90b7d1202b189065b88405056aa8332 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18f16c2966449362e284ff6e0635d2e2edd887c5fe992e0f43c854af4d45f73e +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c158532bf4e895590a68b98a76f1756ec6962469 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad3eb948b1935d28a600ddcced4de3448ed6e2b580c72a8c25fe519707d7ad84 +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01f35012f8941b5ad2c94dde33d5dc6fe26a4d6d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f812fe6b01e9ea150307a0c4ffd5881f1553bd376029d1ce4f923bdd47f5136a +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edea1bb3387c75da861b8dc8718033a27c668851 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14197859839b201ff6b9e42a2643bca9dcafc1632abb239962e7cbdd41b8a8f6 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39e07de18e16f2e41b790920ded94614686d4f84 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51f9048aa6d8c210211214fbe8cea17c6a68384f5f27f52e2f2f4a4e9f5f5bc1 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bbe126842732b6602bd148d426bef963a5fb87f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:754d476c053ec4cff6a8df927a6c5bd0d3a22b2a05c49bd1cea8051901759394 +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a8197bb9550ef575fd36b6c97e0b2528b2e5077 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a0e9577491ff280333fc44914e84aaa90b8415ab493c143b98b984bb09e0145 +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c3c9958b51396c3327bf3ba26abc4d8729c7005 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51a004467b899a1056c3a8c123dbbcad22ed2f2795459797e80fe7e0016a7ad1 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f8f6c8198a2ea1af3e33cd9ee51c49061cd98ab --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c6a12b3d7324bfc14882ae4e1aa475902d5715f6b4ce55cc6729ff1e878ab74 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09f8dba3710ff368e816968f8a6533c19f75b7f9 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de521b761a2264d4ad9d104940b7223115a15a10de0ead9405777ca199390fbc +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f6957aaaee60ddfb5c672c6071f5620f337f250 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9019c73d458c88602fa738f6bc6891fe79b59d909904b3e9160847dc55f81e08 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..517616a697615ac61e712fb6acb5518653174085 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7306190ef85c643bc60a89591b1001d8985fab1be422d0de71410c60448fc1bb +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc70d3465c5d8f18681cb5f5cee72f916219e25f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc4e2a1d6abf045ed178b9e85352d2041ddde4f2f0f14005a6b1a12a9c722dca +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a09e84ae0b1b46c829c5a90f78f073d365b0ba1 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcbc9013dc9f23417a3f4f86dea4ca95117c554642e24392fe90325166c2bc57 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1ba4945127c752e3f2b34b16e6d0564a918c667 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dca1238f3bb81d73455bb32f800a10eb6d23aed9210a714fa6c4c016e0f5179 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1bf93c18066ffceb8af43f973a8c303868e521b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d252925f4cec33a9080a214ec07c87344f9c489bd698ab2742db5c31756baea +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60886f6439cf6afcfe799fb9f8088f4e2860edde --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbdc99e7d959812bb107536870319015e1cf27de9babb533332c2e9212a7c836 +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dc171373158d42450b61632080de433cff877c4 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1ccd3eee26e0a5963ecb2606029aed8ce75129e5630611d6befde497064bb2 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..858b646c1fea80553e7c390dd0c1987b7f740bd0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d2d4d5f2691ab1af7b427f05e186c0bb6e20b96ad0b42207ef8b8b1387cd999 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d4eb9d1e2826a3e88611a57860cef7a262b0e3 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:677b7b4ff2bfb145cd044a9741c04cf20a9d4a15cdd8edabe08ba0a3caa18d1e +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d24fce18ae7f83f27fa10ef09065d2ebf14b278 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dc22e7c59757b1f2bf679b591720f6a6d0fc351fef534bd44009c05cc330145 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fcbf13ace2e5167d1bc904f5efff595a4ab4c8c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cccda4143332dd23b841306a52154826e2c8a1f22afb0bfc891cb814627d2a9 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbb394e683bdb25bd83fd0f7eb3821929822bdbd --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d66cae148f04831e1810c37aa78b3d8a0280632b44965b89d0fc1e4da1fc9e +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f82eeadf0bd991a300f6b699221a845c91adef24 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45546274b12aa5f514c1583cc0beba05978b24d74baee212cde1126150401a42 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42fc1ee01514d460d7999cf7ec03c11541991814 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2202de33cb8b7afc7a15b557bde3943615046a886b9a1e5823dea170c1793d80 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f93cf5b9221cd224d92a62afa92cf230d38b2e28 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeeecdbc89b812e6bbb108e4450db60a50b9872f43a85aeed6a698e805253349 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b9dc6201ce1297183257defe22b8924fe7ad6f9 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8469848fe5677a66558103dde493b71b05604fff5331499ee5fd5f71d5b10a8 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a15dffa95edfbfbb822c279caa0034b5c663a6f4 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05b86ea1d4d05fda7c5ac387b1c318a4405025247b893b831b40dd83fd3d6d50 +size 199058775 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a31cd56ff95f9d113c8e1b66ec2cde3879b9e4cc --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b29a173e846ad4c5053c2e914f5c611249987eb9c6791c019deb31419593e919 +size 199058775 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86f59c517a1b0e199584ebba66c90d6dd65a0740 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d36c783d7c43b01c69950ba174e896fab8ea15f829cfb706cdcfd8310e524f19 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efeeb0a113e58794ef7ece304eb779ba207d003b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c1bfa8f0d7e55e1172363a0b573c90f56a51a33dd027af9c79119446713ffcf +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c32813be1c41c8f4cbadf163ddcbe39a47795085 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0c0090173cead23223a7226a8b82b39528f7674be1b0cf043a57273c687d326 +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da0cac647b117667c4b43b6de64ad76c45065c14 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3a080786bdf6dc097a20c0c2b9e798333a46831ef8783c91e0670d783305e36 +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f29ec9f7280686a0a79584fa42f931715315b98 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ebd3ef1d051a7e21f052337e75e5638e30e4658a0690b05335f45bb47bada29 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3c71ac4e328b1e0bcff1b03146800049b7328fa --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d89ae7306f41779cf7753632ec5386d49d1ee70fdc88a07027df7e562e28f8b4 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae2d2474f0e3910e72d03726731e5057cd520c65 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b179dde4480261f57e8c1e25dc478f699078454a9b59a492040327371c31f2fa +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1799e993a5c29f5f1e87ba2fee0e21a82cd770d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6496cb64c9a16365d0fe25d78630febc66c25e3b81ccc957bafa449f929b9e7f +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6653b982216aec3b157157d9e63295c753e5d58 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c175b1a97c86fd65de5361707b0f2dfe6a9299d94f887ffa62ae6f236b8ae4 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b73854138b2d66c9cc6701b4fedb568f572eb88 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adecd32e9e4eb5760c16bba681ff7a2ef93c0276482726e1acf8dc27870164c9 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..341dc9fced0cdf224f46b644c5b6d76226133e41 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feb51423d97de8800cd0f8902f548a1777063cc41d4f2416d0521059f32d92b5 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e06aa75034116407cec4ee22ceef0339c9bf2d0d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c05e89f516ce306bfb7e08c582380f1cbbd2b52af82c4f5c4f9d35bf8bd80b96 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e1ed0893acc5c760a483383c41acc01a22719fa --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd4c49143c5eb1f03372f86f21bb723cbb1db7dba027317400ea31c0ea148783 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9780325768b7a462f12d8383f9cb942a364aa1c5 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2145da1477df0bbd1eb3df3bbc703969294692276c2ec00c7b05b3171867785a +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9971185d148571cecaf877025e77d133de278ce --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53c02f4a68009d33519709d23c7493269c7568ffec75ebcced96abedfdf1312e +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59b9915109c69292d7523c697898d607cf598848 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:421d2966c038852122ff3d298aa5e1758fefbe60b532e211a4b14843d0f3b298 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad71edbc39eaf24fee151e060efe904f06a15af0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22834e0c19323cffe3182fc81b139878ff7b4c4c6511e667562ae658a388cbb7 +size 199058914 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e48b2c4bc7dcda4cab8a6266bda83e7be8cbf60 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0540f39c78292cd22a2e1e11945258f04f33a013c357df9dd71e19d0874fb56e +size 199058914 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16a622ef77dd28b43e6efcc3181d4fd78f8ff51d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0342c4b76e4b326bcdb26aaf1f6d5ad39f0f50550ae4f6b383f28fdf1575017f +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20dbdc35308bbcdfad1f1c835880deac0d97a7f6 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24540ccba82222d8ee5a261a7f8c4bf9f744ff87ba9b9fcc9041927acf33d700 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d2473e455c887f3054da88a534072d127ba3f64 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad78ec178eab6d765875a89adbb37bc85050436ee5da303c0ca2302a4af4a26 +size 199058711 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d0c1f6cfb31be6cd6e7f82f6911e7ef9996c0a5 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c02959dcfefbb2dbc8d35d490b1f002caaee76759b42d06a561fd6c2552b08 +size 199058711 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb3b10987ef116b5451f5895269e3a4d46fea207 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3407c0ebe02ac458ff7c8a0efd21d8eb283bf755a8edadb00249929ce2c3155 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5998263ed2d68ef7be20a63c2bb35e29cba7cd0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db520db8df33880a40d9a47310f0e095257624ac68a867078af525c51639241f +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4814f6ea31049b6ae521ecc97d294e38daa5f7db --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:014385211702e333bf3535d23e9ef4911c2246a490901f46b68211c9b8969053 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..791b66928c47b02d7fd42abb5a47808a27fa8ecb --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9776775cb7eddfc7c67f3bf557e917bbfb68f525c599732a1d98a2523eab0b8 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eef3bf7063a6a2b46213e65f8f2bae89d254c29 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b1e25659407f633bf58c95fe5851676ff4a310030ca92b445b220fc89ac383 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c76e23342b851bedc9e3bcd7c6c31aa32ae686a5 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16ddbd51bf5ff4f30c0c4e550ca6fada376cbf53917a8eba397983da7221f342 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecc152af743128c5cc877309e109351964122298 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cf4a6bf684dfb0ab6e0511201d4904632c4cd4ee897348531bfbeed0517860a +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c47dbaaf9a4a5f16ad4be9e0b5d8ee9f33f5069c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e2d11264ea50029b54e72279d6306931be8888f40520d46f85bce2457bb712 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d12394bbf777967cb13b90de95a102e076f185e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d04b56de4b9f6ba9754d346cbe405088ae8977e7073dab3fdb648eb11335cb6 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d68261b26c85a0c0fe1d59fa4d331db52aa7ae0f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39aa9c80e7021ba5cd1e97ccc1e57722302a6cc3fdbefcfa6e640e1e5ce99ab1 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c3788803380de4f67bde8d06d2059368537c035 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b66bd65241b5d97aabec8a29294a52c12541d7a3aaabf04eb495515b6e2274 +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9d87c5da65da6adbc45a3f20b32cc6207f21b88 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c283ba36084d4428d432f32c408bbc2c44c9315eb81e82608dbf259446ec0deb +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab5a0782be7e9ce34679564809e4d62730d3461d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8a9307aa98af16aef312c06b479f14b0550621927af83ae4342c3fe4544147 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99f9d7a8a77ea4b3f867c027983d03bb88f991e0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e14d46c294593e25f9787f4609f43e7ff2f12bfe6bddd9296d0fe94d9dc2a75 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fade71767b13052d5828ab83c62b11d1e1f894f8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dea0118b7410fafc0914b50992da11860a037c23964bb05d5ab0052095ada06 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6b30579e00ed7a4fa969f1fb601a9ba38bff21e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95a78951e8046646c115ca350292dd1d0044ae0244828ed92b792cdce4b43bb +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3924838782381c10b6f9fed7622f7c80a4ee0fc7 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dceb9753664619dbf73d2656121890bae00ab126fe55a628ad5e4f823dc17f6d +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdc159c70d51a2252912a14937b57e76f7487338 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65329daaffb70a943ab178ffa0d51d16704149ea922bca31b86910166ec16989 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e29edfca744ecfc50f984d3136262ae777d36c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971aefda22b19a10e26202802d510517e8bd642c5f6df29f9b7a024fd9fd67be +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2522464ade818a7244f352de7e767b18457d310b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:235367bde4394b18fc16fc624a83652f1d41d96cb615f1c7ad968d13e69ae57b +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26de05821336ed50e4a81e598aab5e9cad3cfb9c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:793c3c23f23fd5f5167847b962d7fcfb8fbf02a69ad2c837a793093059a3927a +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..189f89bcaed73a131f77fd56a45858f2e92b9b67 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68515a7775bd82bcf9230e7fac303034d9602af24bd001cb78f6b5bb430f28ff +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..171515e3f71167bbbd87ab0fcf0fe8f1122a7b3a --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef30bedd600fa3fc6e09ef3eb29b07006b18a2edc8f458763196fc484a5f6de +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cffc5f8e2f3ef9b4e79e7255f38005a391d8d94f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27d625907e46b11a5320157d7da583d80dac9b0855c733488aeaf750d0a4e22 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f65a253057fd2c8a1fa6e546a19a51c9cfef743 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:030e452179eca0ccd745e15c55aecb073a98fbbdabd02284f5dc048ac8fb06c9 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb6d8ec2f75c03f1dd52e30b6662f5e213c14cf6 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b152d66593d07b33d11d950350c4bb2bd1a897c782635a1a702f771ddca53f8 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46a56a61758acaf98592d51e9aae143b8ef1f6c9 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c40a91f0e6a525bf23af9e799ff1d12986765286e225f01217c749c3dcc0732e +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04753e3de699ab538fdbc7e0ab44baf2f81a4bdc --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b85345a9d9dfdd94c1108b72dc3757a8407f4b4d91afd4dbc2cd1984e776cba +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eb499ef354e5dbf52c1747699006c896d1cc780 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc5d0707901f06e87ac9e4c16213f66214b70be3278f24437634a475dc55e2f2 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dccd685a9011876af1942fca0fc2a0929c176fac --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:869d58f579045516c48ed73125d3daddf7a145c022bb6b7dfe236e49d8f1f108 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d014459a893a5f655c969401fd7761fbd6511234 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a5379a7f2871024334a3022918eb23bb614ecaebd6871c506c932372794ddbc +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee6da074e27afe0211b1ffe721d8cbf61227bd9e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25bbedc33e30ebbb99534bacd2591e87b962baef8979aa105e382558a34550e +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0d637337b9e6b976f1b127b79e60f07375ac868 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f12eb317b31cc52261a10e55dc87d709c6240e0cd16a8cb710c29e383ff4de +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6685b4c96a4adea3bd69ab7d231b7d9df52af58e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d648907bfe0cd3f4cb443d62b02828153f0c4ffdff88097e92b5560fb51958e +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08172167805a14676dd458156ca6713f35ed3cf8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f69c3d3e21184a93a398c0e57410cd24fc37f64c4e691fbb3640db7056f593 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f404228a3a73e2c499c580cc143f92ef57c70af1 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9795a8fbf3e2548543846fc5c281582ec4bbb167102ae52ea23c92e7b59b13ff +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..325ac879bbc5fde642f49d45e17eef4bda0cd6ad --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:138b5f61b33ca72276f43637b49d8f5bdfda7fcd40ab01553dbf6e9e4292a381 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2c8721a813abf35de2a107846f6d486f276d5b3 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee992532831c699a68a30013164994ed459fffd782f4e576bbb8d5562f84c6de +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b85610671037af28d8ff7a275350555399f112e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a20cdad9cd1eb418cfe520485249554f4bfc41aa80ec9bdb956c8c4b42b5533 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3852ce8d923b4da1c4e1816d064ac4c4278cd8c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d87e8dbc7aa6fe7de3246b1ef044ae4c1e000e8838d995f15d48e31731e41f84 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..632e72c7b9f96298f55b76fdbcd0378b23d5131b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:891f7eed74c22141b62cd93da6ad9bb97ca80a1784c3e695c122d14d3d0b54f3 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66184a7a07080eda0faab13406e030964d011850 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a76a44d66c4f9e4429e556a8c1634bf229d1698d6a1ebd75fdb7d149ecd4e336 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..302b9f0ca2beb285644e9d4ff9d42fff9cdaf510 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e374b73d1a968757923914243239b758471394699c5923074ee37991d2b6c4 +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d99a2597416e062b05908ca3548a097078c19cf2 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ea5eafab950d0f5a03765954af9495e362b9ba8e641028be5f9ae29f9639c8d +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcb7c3de08cbfadade0faf81b7a591884e78fa29 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faad2539f06c64e7534881b7167cba65d652492c2cca42d7fbb600fd139d8459 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ddfd101acffc9f1002a61e90cba1af8c1ae4c1b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17288ea571c9fbb221c7768862182735cfd1141a8aa9cc6bc766d451e0d9e75a +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81fe4e1524c850bc0c9b02ecb1442399f3b04c29 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92c8472bdb8c11a133d689c8f130045c8046be7de640d86e136156261f8d77f5 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..266615d8f87495cc9d7e32581d34807ce5c7512f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05a8ffb597cbba3368fb0bad98ac808499b94a6b36a9e1f8a4dcd11094e3dab3 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36d58583ebc13f5fe7ea71ed7429b700e75294bf --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a16078b7807b3dc2ff04eb9e680d8fecd3b01b05dcb88e7b9e549671111bc9e +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc6a47c430f2d84164514894bdf9a7f2f7ccdd46 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4931f6489141b4beb443469755c1fd656a400d5eea2f4459998e1b0760aad693 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e445b22c3c91d7393a2bcd397354f68c86e5ef19 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18334cf38645f98a34adfc1f041642c64e19268e8d4a29a140ce5004a44b6f29 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..733661e5241bde07e936cabf38650337b0d6c959 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:714c572138bc3da39d9e36127d3e9e2d37759b5799dcc17e6243fe935c0b7319 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a60eb616c0324fd13ad40000288df634b1fc4e8c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be760d08cf1dc6347d034272c75c2e6b13023edb69f7df49a2d64d9d60953928 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fb5ac24a6f1143f8aa615fb4c86d2846c76cfb4 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caedc3656590a8bfaf06bf27fdfbbb7f0cb2ac05e17365b98469eb912be16b1d +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc7559f2ac54528a09132cdfe3cdbd6770d58079 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eec664802ef4c3668e92dfd43baee58cc380f045f06dd159577b0b568efd266b +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8a2329322dadb15344122ced9634fad08682082 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b1836b877ca101aa97bb98f9ae3fcbcc466e05a7f8639668fb44483f7bbe5f6 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edb30a816589304ccc005cfbe9369b6cc520cdeb --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:696f3ff4ff867ca2b172c1752bded25515fd322486c5849ca3f2488b9058c221 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cf8bd7deffe8a12b150a1e0752c81aa4221660e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:462ad3ceca241563e683685c892723cf85f65ec4b535c5a5c9af996b0e20e611 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..475df91d8ab4bab8421398debfa3df53e102834e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23c027da5c530d5c0e794ee96949189713f4a193110ec25529a0ddc9410a56d +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a910f39123fce9dbefece5a66d6dd494d58902af --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c619802bc635e3adc48828e1abd538a6e7e223cbebb87cd60ed84d9094c446a4 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12d5b6ffae35ee5cd45c455a751621b4ac410c62 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e560afa5616499edabaf0216c38cda1c3ded4932acf5edf757ff70fbb518c55d +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b07fdf8a281aed2236ec9bfca8f035a72e73eadc --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb90b28068ae303048b9989da1cd172f64368a61f7cc3e46a6ca689dd54e35bb +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..024997832f3e6f0a5a3cd22da448d216612e1757 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f5cca45514a0604a5618d1512013dcbc72fb6624134993df7fd13625652342c +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..652a18b02bdc5ec73b3cbc8b190f6412c5751b9d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257ebf98688529be1e72fe3cf9c4404924179147a956cbcea0ccba3e155885b2 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89f0faacfcab96fb1ce55e7306a996659299fbdf --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c72ad86a86a881fe9ed1e1004ef8314ad0c2df8880c4acb90f59956f89fcc27c +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7e1c7096b455aabc144c434637474bb7c89845f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26f8efccd2459fd17b9d4d33dd820f8276ca60a46bb3006ee2928bef25d0ca28 +size 199058647 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7adad0bd74a4f8d0fccf874c1fd0c1e25a47a11c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ebf9b4206a83ebd7a02572c80c3cbc37e9306068fc74e3475ef30bc778509d +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb90a0ab5c0d4c8eaf2ce685af023e16362a6e68 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37e7a52e5cefc60eaadcaec933578a32738754f384fbe5a76d0c13a39a955e3f +size 199058850 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18fd2363431fde3049808193b9fd8c8bf8b8d057 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd8f8bd35179a6b8f9ac9300ac785123235901e5f781c560beefe809731c2cc6 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b07745feb2dd3e0af8e44afe103340548422a1e4 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bddf0a26c1ca8d6f730c2bd0b63fbaf9cfd52f88583559d9fd3b536c63d663ec +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..621b4c3b8440f9a2c9098ac508ef885f4c1a2a84 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2359a3e2b45862fc62db3eb92acb5b6eaaef7f6ab6c3d05e0000d9ec0555d844 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58a8904b70b27589027d5ae1ac1d98b6a3c775e1 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5220d188f637e0c2571ec7926205b59e02387c4422150060ff6566b751ce4bfb +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d479998dfb99bf26b9ca23ae9b5a47513539986e --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e31a0ca78359299d8b4bf0e37ecb9783b2fe53a7a960820f6d2d777dbbadfcf +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de7752fbfb3ed2bb08da44ac110b6edf1eff0299 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8112727b67f90dcf0955dbfeeb6ae04a3422d31f02efb7c7ef981ed5aeca2c39 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9bc17cdaef480dd066d5e7adc97c1449449efa7 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67dd2322892663613236cce60b1bb854c16974e1ab6aeff64ef572d913121ea5 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..505ed90a3ab7dcb76f94fc110e1bae10c4fa5177 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe14e06c6d40b1ff1eac281399d7ad28741234e18f48e4ef6cc0f060a75ec690 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4974a930723972ef28441dd1f723bf55af22fec3 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23ff1ec4b7edaaacdcfa2fef669711f92eb9fe52df28122614b5bb0ced8a593c +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ab910a09d6c3c2a6476845d06a5d3bedf0f8d5b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6481cbb9c24253e95cccc6dbccf86ce7afa39a9b935253abfda472b9ca4d0ea6 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77ce4b32c42f54fc4d1db0ecc1fd3130fb80c7e3 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7252830b367070760e399bd919ca18964227c431c95d766e58c8919d9ea8ba35 +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1fb46b71519f547bd2be30d570f5ed249a44458 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae086ae83b4cdd1746327186522f3d1f260cd1d42d6128f09695379f4385546b +size 199058722 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..621432a61e60e70e5b9a377954cdc893820a96c8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f3d5f32dc010a8870655764df5d74679ef2eb00447fe637d29c0297c3c7beef +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..504499095f6ccd9d035efaf53ab273c7055668c4 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edf33621f4d60842ee16f8e7cc9c847856b262aef92e281ddeaaa03385a2d626 +size 199058786 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a08c96d41da788c3c613e20261f72beb952c22b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb46789a692d64939e1ce34a4beb21ff95b409e1b0d0488519831e8d5da48a4 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b160d9fa5ba000b599a82f5a393745ae2c7b7292 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a4348bfe36a6b17c9676bab7f379e2199da04059f81b5ae195b62660d52be1e +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6cb98d63ecf35d7b248a48280b3ea086e035e2c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df60b16ff7ab8ec0b05140b5b2728c2bd3dcf5b0063b9e8c46912435729c58f6 +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c109d79f81e246696cecc41dd14c293630fad2b6 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b6dbf1c5ab71f5a90a36a9f790a7e72ff7e768071ce20c7dbddfadfe342c9c +size 199058658 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..734835b6343d75064b41b072cc629aa8913e70bd --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eefefb9f648ba763d47a448cccade70b3340fca8d7ed31eba4b61636a5d8684e +size 199058839 diff --git a/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca82fa225d29be33e2b04fbf86d71a3aacd9d626 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e18e5b40427b6a21929f55e9de29158a5ff524da02cc173003366d307edcc1d +size 199058839 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_01-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7660c0bca40d537c8b1fe854838e4b7b5dd94a84 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58af4222d2f3f430576b289210406f21ef7aa3036cf1caf06834dde646f874ea +size 167511299 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_01-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf2650da471687575d0603352539d186ba9f871 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf188b8d447d979be852dd2c9652a5dc219151e93e43aadb5638b77c8411e04 +size 167511299 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_03-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d78793ef6889119ad3213d4459f9ff4f8257e9fa --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e24d0269ea54b74b3871e4c5634dcd09f9b825d32d466130e2e692384e9d329 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_03-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7b642ed8190ee8a1e91a3d5481fc5d88ec88dfb --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f40cadbac34f391b923e099b1af3ecffc434626097af01d168e91720ed0b754 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_04-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84c1a8a46bfe3eb08d3dc672ea09ef17e6084d1d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:802f4d6cba9aa9b74009146138ea57e081bf5725c97953df48bcfc4e24fac0ca +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_04-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4982e07b8f586724fcbe53d4a379c4d749d6d9f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6535237b2139e98aad7eaef3db833f72d8d5adb2918b94cdae0c6779824c3ef3 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_05-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5be5bd1ed76a74991f8560f645f5c332afdded72 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:463aa5b5a1a2ab7889c177d21bf9dadba4cf393cfbe37e6be01a6c5e83bf5e41 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_05-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f2d55bf7e08799aa4ce8524e5a21e5750e7df0a --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:657b44563f93bc52a8ba2d6830ba587d30d44d9153267c94d3e4d03f1c6c9710 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_06-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81f65b53795e2dd1160eb15b7a1056bf400cc9e0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d7b6a5c4640862af5d1b1c313ab262e5600641429978ba0748917567492a89 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_06-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c09e203312ded4632036869da80396876b7a1e2f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab9938b7e0c3e5a1551fdd3d0675f08530ab8d9757de58e07d2cf63449cf13b5 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_07-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b301c127fe41ab6a2a5273a1196c220f119d7ccc --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ca0c9ff4252caed845c7c41d05f939b7a9e0a8a40baccdf4a85205e4e53b4a +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_07-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..780522ff6178064273082054d91fce6474c1d3f8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ff1fc8587041cb41ff83607c78e0141f744d3e907cab098e228cca019f2fcbf +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_08-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02e6c4de66aa3ab7de4b1f250f47811f6559ab74 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9921c15ab4f8173cd902f90520d93628cc70687b774497bd1fb338d128632a20 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_08-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2e114f976ee70b366a7baedc6a9c87bd806a706 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c79f1d07a16c78cb48021ad51d453105609dae4212f6cec94451308cb320a1d6 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_09-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f442ac1f0dc3c33cf37711b5c1d7dac2caac80f3 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2da559c3817d3f6313783b078cd8e7b8e16ff0b60b6c02685a69b79b234cb5ea +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_09-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..148fe516bc64b5cc83bea8079753ea8bfa823fe8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18048989895e5d9bf8f339ba209038acdf291644d3f02b4ef48cca71773e3fce +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_10-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f55a3160efb07a9ab3ddcee7f163636ee70aea42 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e987e0b9a60ade0c0e51b73e7e06c6a8451717ce46e43dc51a354e626e9e2f86 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_10-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6853754fa3cbd5b74422bddfca1ca7050e433229 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31cb53887ccf7c1d362abab9dbe99673b966183b5267580a886c338c34120361 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_11-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ce3d551f339ea3a22f8c1de948347f602994574 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffa47d3c8ecf47818e39ec94836b09ab109512b4d4189260602e6bb2e7231a84 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_11-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f4ed76577d8063d7310145cc387c97cd96e8a36 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ae331cacf5d29fdc7b3c79af6030b1490ad6f25a065730b8e84dcf84ba2cbd8 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_12-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2ae2d332db73085d65bb7f5d4d94130ca56efb7 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1681d707456ed94d6bf1e3667ebe0db969f5247cf9cf7811bd781d294432cee +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_12-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb33ff1695e05ab50021bdffaa772e5a036500be --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17d3042629e0b7ca19a1d45df9968c538b3ef6a3cceca0f30523e80f6481405e +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_13-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c73e67ea653149d53bf4f7a81bbd3ee6211428e3 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6369f6b4443f7a35facc0df8b5e15aea20f6c1a658281ceb3e08ea32082a0f1 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_13-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96f909405078c4489977d4bc3699875de72b4b87 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:104f75b5a26e4269e02af954593c8f2d273501c4bcd1f9e8b0ec375a0427fd4b +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_14-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aec5ba7f59e1d025bf4febdfd1e63af89af6dfc --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8539a24ceca1724b5eeb19e1e42cca6b9b1729f1c11f3ee0680f28e85ead7eb1 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_14-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..709720e0f26ea0180ca2539fd90d9bca3a42a5a0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d1bef8fd89ab55930dc27263563195425d35d0f015c837613645f10e0455ebf +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_15-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea0713a276429093a53535735b9feec6080f22a2 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e3d537165cac9a795a76f96cb51ef4bbe23e9108b5e9384027c58a8a50f98c1 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_15-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13ca3cde7e4475edd5b2d0a083f4fb8920b5d4c8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6396cf5c28a03f6fabbbb55cc49390f847afb157684484cfd88aa8a148c5f91c +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_16-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34e211d6d82c00bdd977fb12f4cd9cfc993f4736 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d00371a5f3ad2f757ec7e09b7d9b51c0779c60f6d310261f7a1fe572a1df1d1f +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_16-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ab0d176aa1488a225aa25f598bbb5773b9b90db --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2829ec8f3abc3095da939c2eb182c087a42b4d9b6e21139200700c9bbd416653 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_17-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8de48d129fa31652c5bffde21a7461e0eeb7e586 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0e5d17df1ae4b6316e342c907d3bc46361d62e79e910da044ab40919e7e1ecf +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_17-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93cd7a0cf9562e57bf3e92e2ab173f00fae9b3d2 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8259dd7093eedbcc03be2d6322ef0824db6fac119d3a357b3311946a0a35373c +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_18-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e4974c1771d28ae5c1bfbd85556e0b96ae5e48 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b63a8e8e3ca16c7ebb1854d7fb408d24c9b132641fd40d84f1c73f8ddda4cf34 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_18-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..698e1564ad916a0638d6282e564fdcca525d896c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443861cee94df9d7903d5e6b84c0392e7e22f6550b5982294f3c0ae2e0d7580d +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_19-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a3f041cf32922d2835338cea674f22fcd58c6ea --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64ef9cc75b028e6d2fc4c127f95d5c6c170d4937e2c8935381a1c98ccd3e8bd5 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_19-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d31d22e6efdea710b183cb3c4e000b9936625c2c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb172f2f3fdd2f5358590644c4aaf997fabb3d49d1fc3f778287750e4eda110c +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_20-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5915f3042f70fdc970e6bd96b1ce934a646278c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:284db34ff6c6aa283582e940827c396d774d1257e557d395ce388be2cdb7abed +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_20-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbc6d4289c533c9b3b12918d9f9eb37e1f7f34b2 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a28d32c1889c1fd32a353400b711b105a2cd42f7671f0f37aeac7e6930fe60c5 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_21-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e0c23546ad39719803aba05fae08877f2a2a622 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:717117b49ef593fcee11c5b56361100a77305137c8e73afb39d7b2e0cfa471b2 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_21-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9915807a203a98438fb7369a878aad2ef99b9fdf --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c740d6a72c55f1bcff98bc2c10d893e9ba1b40f23ee88eb949fa94e4fa1e13f +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_22-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d89d30b3f937412047c3b5979fb72226b5122a3a --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64f4a5884086a7ed0ddf93d8676686b588db8db1af0e20f9c1a3c0f95079f064 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_22-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9655870a7671929dc8977861b4d6c43b3f7b2a0c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beeacab8110a9aecef44bcc8b030a73b60e615649516e8a1e16713ee2ac893b1 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_23-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ae3b7802811876f8829a6838a221d7a0504f2f9 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c4c45d4f60ad1c0ed38f9f4b31fc42379c325a3f30b40749d0c6b674db82989 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_23-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07920a180c76af513250dfb884f3783623c3ae04 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd72005988e0d38dd94128d2e2bd944566ab16d917331273f8b0dd98a9cf34e +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_24-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5763378457eaec258f380513436823ae53344b0d --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e11875686675c7d40ded36510e81f4d1c57a047c08832c9f2502d81c06f355 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_24-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43a5697b050bf6e2e7b8156b2c5f64230704ed36 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fc4869c05e532611de1ea58265f127d8025d49a2bc3b9bd18ee1b4b34328ab2 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_25-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bf83ac1e124014fae5c144e940995e2b3047b76 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:632cca4b4fa1580f7bf4904026113750da0cb649cef85087a07b19ba84847110 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_25-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b51874b952e1520e7bbbcb8ba3b55a6b9a77b38 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265925ecec6d3e08389a257e98f2b2aeef14ab2eb31d59efcb612eb9f6ab5367 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_26-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65a16d146f94fa7af1647377c7ed3bf96fce23e0 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d6914829fa2ce3e2d469c5620412d16b117b49c9a3268f4627cf8d42c320fcd +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_26-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ccef733d7dda48a683a97def22806ba606722e9 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a3f580664d046d5454ce31deda99e4f9bbcb7910303f2d26c151d8073cc40aa +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_27-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5475fffedbf7e7dc193479e6b7a86b7f21b20f92 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e7f1c3012c614129698bc564fb1388de240a5dfbcd70969434712859a7b5b0 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_27-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cde0bf46da4f3fe47042421ccbb9c0333ce166bb --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c3354b1c503a2c3751c2b0a2305d21dca0a85b8b988bfc841e9fad62644ffb +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_28-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2721c116a13d0b3ade90843636cc610bb96e9e8 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:407347dcd5944aebafbfa362ce40b62f1326e0acb2acab4673e070d79be8f16a +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_28-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55775ac2badaec4b7ebeb323635daa641072eaf2 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf0bed0ce78f7a8be53cbcdac2160cfc78957055706ed76afd9b914eeb003f59 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_29-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60498c8a63540a0b88f095833473e8c42c1f383c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83ce7679630d88289b52564fefc8d5325d2bd64778c5b30a151c2b2b0e0135a3 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_29-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9eb65ffbcdb094077100e860a41fd2689ea1bd7 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fff9a4af91e7b6b8015afeb9b3cdb59d4ef9267481f4894c182c0510627e861 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_30-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..819105da213747756f98fed50942ef0ed9ff9d72 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a11358e084466ab2e485972bfd4a6f3421bb3295d8f70b61f4d864cab788e3c +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_30-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4ab227e34782e931f2946e59d3cc48362c49978 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c37b18239ff50cc09758595e3ae8549e71e89c566332455c21f26bc4b617542 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_31-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e42ad0bc7e66241c908c7937d878a690b13b885 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54f9fe00dedfcb573d0c373c97bf34b60113176aac4ca2c6f67c4fb612ebe804 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_31-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aebfc5335b5265ad48ab22873de7e48b66243321 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e670d5ae53e1a8ad8dd4dcbe84058a2f137b59b582a47eea7a155d2fda472876 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_32-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad98210d05d28ee390d6e7a1ac016b8659cd985 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f18ac68d407ce34d0c4af5ec1cfff516dcf94a562054df31338b45bb5f5207 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_32-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd8e0017b6bcccfb90d2a71bf27061043067f0c7 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bd935c19c405a6fe9a2ceb2b32b1ca39053df1969bcf5e3fff53a909af9a876 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_33-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e8abb955fb3badd382cd1b727f7f9e1bc829bd5 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dffd8c52106af58eada079666f551c56915be0bac49cd5e711d9791f611b2fce +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_33-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07c55ef3ef6cf5f4005f5d20869cb8a53721b3d9 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22264581a6c73db9234eb1fce8ccd8115bf206e5214057c10d33a71986a42085 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_34-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b100e682e5911fd2652a77a4c42f41455d7f66c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da7014f80efb076572bea824ee1e53dd3af24ef9b647cb69f64d77327f1b5e27 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_34-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd1cbdd8aff7ba4426476f9da2ca83d925327d2b --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33f1632df0706a9ef8bf573c873d4d90ef640664ae6525765b876a47b1a608e3 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_35-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c05daf7d1c8236855daaddbd2553aa1d57e817a5 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd1ff09c41045d2412d260ff77dd0ffdebe276dba6d21e3040b65a919bc4456b +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_35-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eee703707a34df5b23e30940b1ef5a6d544f284c --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e6f4085f50b927c44038ba4f0dbb4e0a58668728fbc4d1d507311ad85b5fad1 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_36-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4597920ff398b55aa0a6c4f5ca0cb9c9bbfd91c6 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab8c48e8426734c594105f6a9683d5e3918f9c82ef85f0a1dbf2fd957eba0614 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_36-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de94993244ea6c1098c48ef44c9fb365f463744f --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3fc259c24d08c5cd8fe82ee4c9348faddc9a0d37951d2fe76a1a199d6999e2c +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_37-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2df6b3625cd6d7a37b04582d45eb55fcedfe241 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34ec4c2a88625264e7138592598aadd4f4c05f868e50b872695e71eb96401bb5 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_37-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..805876a41362825593c1609f09fc374eb2f8d4b3 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b60c9e2580ae0885a22abffa5e5247bee84d59ef788784e82252cfb21219cdb7 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_38-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4589e3ba8226be8756868e4c84cc0f0411511e3 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d81cfe43102c494c79777b87236482c5551eb69260eabfe2331ad6e00b572e +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_38-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f8dc1f627e3a28496cdaa5bd4e697035ef01511 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fce62f6f897420f708e94394f5fc32c5cc1f80cf8b39acf22281716c9c6b916 +size 113308931 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_40-model_00-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6debd0367e430307ab86bb9916109811b8d9a8a --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91d017694560e665b3fc314c6855984a4825f594b556752b7f38329ec8a1e380 +size 13507 diff --git a/4b284b84bc4v2seed3/global_step80108/layer_40-model_01-model_states.pt b/4b284b84bc4v2seed3/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7657f130cbae1d8eb667045f192bf7bc77301367 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c03cf4a6c4567669fc26c65a9099000ce9fc7dc3cc146e3cb2b042f4cf1f2bd8 +size 13507 diff --git a/4b284b84bc4v2seed3/global_step80108/mp_rank_00_model_states.pt b/4b284b84bc4v2seed3/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01914057f81e891afee06bcd1f448e7760c63548 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:114ff88e400838230d7b647ad21231885fac245b2c2a2f1e9197aa549dce99ec +size 51507 diff --git a/4b284b84bc4v2seed3/global_step80108/mp_rank_01_model_states.pt b/4b284b84bc4v2seed3/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b7ec5a7c24d84b5a59b79c9de4a6f15c84cb9e4 --- /dev/null +++ b/4b284b84bc4v2seed3/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a22e0c588abab32a0c92268cf50ec370140a4c298593cfa674af9c8765f9610 +size 51507 diff --git a/4b284b84bc4v2seed3/transformers/config.json b/4b284b84bc4v2seed3/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b84bc4v2seed3/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b84bc4v2seed3/transformers/pytorch_model.bin b/4b284b84bc4v2seed3/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..d1521a3133f8e483e04501f07a0cb5762964386c --- /dev/null +++ b/4b284b84bc4v2seed3/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c8653af69b7b8af39cce4bbb822514fd78276e7e755f5f99ec3543183c6b3c +size 8781203669 diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b75f6f9a4008bda759a62d4705dbe8f1cfee349b --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.34441376096478077, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03364738239161352}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07156437671140904, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016916866568706518}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.29498663582371476, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0047504849601230975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10791921496577737, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002171402381627088}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03339629860790558, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010276756756951227}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14089640762105182, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003169219645311096}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0506136487550108, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013544155568851314}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06867849616024986, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015588261952769657}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2865361097530141, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004609475551865619}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10397564759824128, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002024130402320653}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06816360012566612, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001597766711115546}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2811330280761629, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004465952639791254}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10284733675284609, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020471999326618765}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..3ec30a01075b4b1649b313e641c54b4496c389ba --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4687199126816133, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.036800374006492664}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07570221536151728, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014363865463457549}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.37281196342463774, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005425026995807581}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11753553291473576, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019140656759965315}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03517849994399333, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008874020071430252}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18207060381703669, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003664740082406787}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.054731274015692305, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011992442792975787}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07143954952407837, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001305238902060498}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35175875189308164, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0049642525171124975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11105152882900622, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017516497637055164}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07178061720744913, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013540467985344866}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.35171330673154494, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004937137016938597}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11134944889691471, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001795094595999485}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..44e16169d94e0a0cfca6c3ce57b7ac6a13366efc --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5235717824828133, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03767810577658163}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0783700606217331, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013622939044074152}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39995054593345924, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0052804057805626164}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12260704886786168, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018070929383927695}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03627187434475958, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008236125331839457}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19905166470669564, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038388111983134595}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05717657732704682, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001147470465886568}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07359908440403741, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001237832140736892}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37356398478304126, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004770085055809505}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11517678618925936, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016478650517612742}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07453785183849788, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012849507538737566}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3794084560485554, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0049017847382029295}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1165772048673089, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016980264714204242}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..fe89a84ba63436fed703f4c63badd1bbd2954cb9 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5916343641542043, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04024225062945221}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07888158387802857, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013905334633539245}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4033319142330156, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005299089005220485}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12387093846990074, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001885726927501542}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0369653886039744, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008664032303747072}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20236135540846556, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038733010690355342}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.058284289461857604, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012101468635650288}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.073511276121497, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001251002353845416}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37511361165748164, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004789107031378535}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11544325899200131, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016990426527488723}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07497143356596919, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013133945848135208}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3819932847239564, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004902385390105475}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11762103770674365, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017726486791392565}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..81473bf4a3c33449e459efe8bce3f5d80a85563f --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.584148826341706, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.032088259094079065}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07737100502750222, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013014310515114744}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4039418841652104, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00530796073731901}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12197092014603778, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017607850151334767}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.035917415755917156, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008009838171179654}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20296997665907882, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038561197119444304}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05693950723216792, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011236415767176787}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07227090942349099, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001170080155549711}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37605665528150317, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004782196417125406}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11390315132939448, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015842511141082533}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07366718744107867, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001228472532147223}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3838102958885374, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004940246508662335}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11605708607515382, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001657698456603933}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d3b388094f8713d3884886faa1f87a49c1f71204 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.643769416521065, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04327961614658416}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0778714729225077, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012716812804740509}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4199879645762265, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00535881210434279}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12362474434882809, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017387117939925156}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.036051220083070316, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000777501535408198}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21150748306290545, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0039302718094465635}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05758469671440457, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011051399672881632}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0719478472042638, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011295516496439356}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.38653994641960504, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004712427125192832}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11417482723461402, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015386798608318928}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0737393959127114, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001196371537872998}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.39623787521806264, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004912468268398718}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1169653954794077, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016283607844766808}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0c0791a9393afa43fd5577d6ca42a05e94d8859f --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1537922187888957, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018933213102104863}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2625407961087503, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002682894905994936}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1799962602325878, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00184248350208152}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.030157104540943284, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007476727834062231}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.055001050533522555, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014448444524840297}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03586670200965267, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008450513639399489}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11780986849918428, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013162517308047393}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.20916963040579825, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002196518290796577}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13967379634609953, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013162078681435803}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14081205310262065, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017218252583982084}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2419875104700217, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002500846878935716}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16507864218420232, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016765101940476469}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5029930497312527, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.050686861917854}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4c9cf039c07f4d98d6dae1e68e587becd421041e --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.18419539466594548, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00216315844926582}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.30850131448570595, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002881646502827461}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.21295884672876816, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001991739006687224}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.044713693466448406, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000968138913860097}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07839796746781187, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017417848523259565}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.051942458861991954, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010199515581882507}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1326981808478002, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014579507711624912}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23011492408104228, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00229754097749749}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15484936057383927, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001347730246639345}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.17205251851388254, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020202953529773735}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.28974852616388547, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002737913509276009}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1992303563413742, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018619630110637574}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.7242641167777077, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07938213037481555}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..28a1ac0946834362ce8d47d751f1856b9b1ad2dc --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1997095751146021, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002703732640041402}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2883485784255837, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002841589718801568}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.20703905721090818, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001929567362026057}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.052135221349108814, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014902691345396325}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07402543775497225, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001656124634067446}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.051520411225961356, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001031129051354628}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1503544839184264, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002191707211555614}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21866995964876715, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022872119612051362}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15441401199805835, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013920098120515118}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18828746764086687, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002574176036533358}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.27233360792883826, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027083132609021184}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1949510570568441, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001804660306034504}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.86942295772908, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08758910211106738}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..56dde72d969be98c205ca085a0ac89b3483bdde7 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19702312634415606, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0035795334816332027}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.22825422304548265, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003232347523636064}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17391868610816388, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002277407569748311}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05667983844146617, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002120538883847141}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.059228247136442105, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015413764801780459}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04463749924381735, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010686000964725524}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.15076982480282128, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030098254531581766}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.17209850822866807, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025209050965990243}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12950729491278481, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00167294588483517}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1860026881384513, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003405588840643614}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.21613806050396925, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030779584306118175}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1642422006919473, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002147002697595944}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.0330716712469843, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09425863264675978}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..07ae3648d332ded38b3f2b56b7ab59f545f1cb7a --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.06862907083042237, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0029137045746235116}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07213602119470613, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002675324630242608}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.05441509889844838, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001922155872957772}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.019800771477798358, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014215056199837948}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.019407609285097115, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011737580125973422}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.014130696002074776, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007469700039793996}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.054030861033230786, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002428473990666629}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.055369844370012286, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020897273452589395}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04132917986525425, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001453754043869357}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.06581471030428865, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0028148588567455577}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.06855419478068313, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002540543323104449}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.051839091609912694, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00182789753930337}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.4039582112595248, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03484552558450677}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c3bcd49760356c9806cf2e685079196aa1bfee83 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.010184074003326236, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001185280919251267}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.010530222683810939, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0010849872451804167}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.008187248278912505, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008215139146136158}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.003045190089865129, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000629256262446744}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0025316582919952747, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00035954782149502667}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0020440057618351945, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0002894852867481284}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.00801661098513702, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0009926654487693505}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.007789272405875561, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0008037973390293996}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006141492653296614, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.000619473069682991}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.009784563527498156, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011539456656877766}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.009966706597956685, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.001029454113884746}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.007792108172262034, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007861479859061975}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.0014137810446263e-08, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 5.022609361040328e-08}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..aa082103c70239b388eb4d33170bf651b084ef90 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.1668198320527802, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.01897983257333898}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.030286876271392194, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001036156882791465}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.027143500611213456, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0007465539304065285}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.022506347386715704, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0005868062207608241}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.0011223500556642703, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0002013011694364979}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.0015238484363635906, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00022622383493949605}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.0010842906651617643, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0001636612072099844}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.029891451434790904, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010048119314992631}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.027040559559811043, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0007436210949765598}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.022348380076958108, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005776004107689916}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.02960870450534663, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0010175867142908736}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.025998503793795025, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0006867190478188373}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.02171066987180087, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005513649905399339}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..55d234f6a889962e3888982e7d65fd30876801aa --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.497789088857585, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1207333221383202}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5193372726053079, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032827860366154518}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4187417243003722, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029601462557396806}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.437040451945744, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002333774145212166}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.24404637097851045, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025862116613527076}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1933021952228981, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002111531045223336}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.20198550157867662, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019395848816704526}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3793149671052253, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028788724723207175}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.303084323993645, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023997981815417927}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.31702593617702457, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020123220115816466}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.424766622860286, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031065633020390844}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.34158689328494163, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027234093565780253}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3567272344346471, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002273204999670106}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..53b6b96ab9633689c2740afcdab7af97134b2aa7 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.232352061213327, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18438572640282935}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5438295687735817, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032626249125624544}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4519156735724399, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028471232903033885}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.46686827804183195, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021857893913537927}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2677592832314449, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002678442807946661}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21857181845743923, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021530696594196743}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22608889723213235, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001981518091728108}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3988680585181114, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029405304248634437}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3293160518559301, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002411675944122487}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34083378350431404, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020309168195614307}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.44900069330118875, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031269512646810997}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3728742942560764, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002675120241181924}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38531835059376945, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022236074600925494}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f3cce36077822986a456ad6535740c87c6e127cb --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.1599321841023, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1879116618302546}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5316343436240858, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032625643740183926}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4648983433320942, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002828266123213244}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4695262322349431, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00215490562453037}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.26457242284963084, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026154624845308966}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2286713763984792, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002213558974457314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23062310394414082, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019690665088102194}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3891085104737073, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029515533104354013}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3385179926519356, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002447035400467983}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3421096115443624, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020310235455138293}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.44153945634327574, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003131733329038247}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3859861563616844, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027050660850819557}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3897046712016254, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022104074028312126}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..435c21a3e5f146fef1c6967f7302af340eeb07a9 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.215875217167579, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.19854834212398645}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5190910100984744, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003294663292154946}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.47129632991643877, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002752331164331658}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.46760558865318314, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021274829390602406}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2607371623810947, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026626721914091273}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23271303570323362, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002186914450625737}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23112566064185652, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001973386702544114}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.37743317581253305, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002922501161012456}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3421754841859648, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002448897823883138}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.33922485306684963, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020379531080847698}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.43332497676504134, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031201843719093183}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39450016226821116, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002683555554853958}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39088870724203995, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022061435555151025}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1b06c34a846c69ace3333aeef46fd120f64cd280 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.675372357471726, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1772679235890945}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5079146856634101, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003244631875951903}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4750602535272041, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002707456752563758}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4652741436608286, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020856290234426084}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2506185278912072, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025688729450509744}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23020274907523836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021319283224229416}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22596116871891767, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019272220902171223}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3646830222320307, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002836137970051408}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.34124704138322626, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002433024945476074}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3336418614264682, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020082018536239574}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.42108375995240394, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003034856921594324}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3952453063898795, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026571910552197976}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38639018088252236, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021588490021418913}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..eaeb51297bd78a4c24f8b2a67fb9535f3c73931c --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.17780010896090837, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0028657687702784394}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.33168127958194993, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0043909919411222464}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2181226869116415, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0027581474749694035}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03931279207892139, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0016581578355807393}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07619599508022841, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00272241500352495}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.048528921002958546, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017764487817816764}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.13228242420416667, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0023035178337467654}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24740150573619668, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003505699991405706}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16205491808395142, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002184657948901955}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.13792549177526942, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002344912834751097}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26116272332322926, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0038687142611478474}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16995115866612748, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023209836007670715}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9965727451782298, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15826205801047227}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..63713ce20362cb8c4dc03bd2d608d6d7f60c6294 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12623297679712753, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00185031477682142}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.31355314687479174, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004381874835308543}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17785826511919287, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002506168575309281}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02671739102876372, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010147304084239857}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06963018507899452, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002768236684178756}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03812763380493433, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014499362846337098}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0989142119051423, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013791496324926688}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24757016935280626, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034520987132384117}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13961978647843165, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018876284466631298}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10042944590263467, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015100489954681905}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2518445443289288, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003780328500383181}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1418358500050043, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020742150121420516}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.521961099148944, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1067162997839333}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..94ab07d402fd4c64c1ec3b0fa0bab69d6d67caaa --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12776888363608563, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018271531287357235}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.31621003695806416, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004292592593741099}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17992305299553213, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002471474032703446}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02713599956564803, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010066515368428789}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07048237066918879, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027207468576705084}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.038746331277995295, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001439750042341812}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10123566070632635, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013895764877661831}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2528390510389675, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003483747346972295}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14290468633219328, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019087949950632504}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10104760152172992, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014792769919128913}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2530463368650048, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037161332717751}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14276376154853065, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002040901548342001}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5280857149419538, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07885108475340596}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a570591658a647a68d5326c4f1a687dbf94b8cf9 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12121822408668065, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020739133661264075}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.287891057927081, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004579134322254905}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.16685520709327625, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002665570155443094}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.024946562796427662, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010295220175533656}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.062229435333035196, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027102677143777706}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03502142308268661, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001453833565879767}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09584883568666924, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016019599062301714}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.22935087983395927, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003723896150091747}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13219464959176125, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002089625494358884}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09677327103730465, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016860407775182488}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23249987999606497, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003931934403157173}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13360679199458778, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022032590659256113}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.521537278708307, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1340390241992026}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..048bcc9d882a06172b2d660f3471905408f3246e --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.038078096723767996, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023781047408131164}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07110840872162687, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0041655460986093325}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04534730746066439, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002611229049263828}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00755130939213845, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009407309816817791}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.01456763376419491, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015059193465168199}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.009137318621937963, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009714552620996167}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.030895255217096195, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002026498228282476}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.05673417944538178, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033250538537188097}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.036178777224856525, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020901567682781942}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.03193887181863606, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002103908155038245}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.05872079534060702, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034877968907706214}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03747044675977351, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002195978615372179}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.629879023989858, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12544962320083983}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..3fccf9c899679e060f44d81daf89c1d7f6b12eaf --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/agg.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0028153785061314713, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008109014775672004}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0022397022323243287, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0005923742999126791}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0024480546534426002, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0006663143862102796}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00032960010762452495, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0001942158416689748}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00021523288032721994, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00011457292554383501}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00025593065551168283, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00014085048380669117}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0021686356526300445, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006433045803199352}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.00171133818409571, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0004578910681243736}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0018728301034077845, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005184193716142723}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0024191989997527706, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007056629627390068}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0019291072387565224, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0005158196897264791}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0021046719353290323, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005793875805849997}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 8.029951400668467e-38, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 8.999389473215882e-33}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9f8bd98ffdd31f9a060ca865b02329e543a397da --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6b504b1aed581b7359a89f7df3479cde053d0c716478f6202ebde4485e7a2d +size 4145814 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..be575995d9b9fdefbabdfb532b010c08db442f26 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a779a5f0bb47b43d3b5b2c671e75badecaef316faafae4fef46ffd299d75efe +size 5102219 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..21ea860c27a77f25cec8be51361a922ad5d6930d --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a042231cd7e5ce1ca3dc512a02d044c25be3ad57d7c5bac576f5d71919c5bd72 +size 6011533 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d2e1223c17f49eaf016d5bf525dae76da4577171 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ec0a3ae942a50a9046f7af686ef8270c2ba819fb0f42b9ab76c182e37352e67 +size 6921897 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..774f828e885762cdf6d50389a68e816160652797 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9658f943e319a09967387fcc6bc2a95347c91db2e9cef15785cc58f7c1eabbf2 +size 7825017 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d29e18f3d11c16807adf63766ca26a9b20e2b6b5 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abd7776ca4f0eeb3d0f83ea2b20278ed5dc41661a30bb82270d7bc7927dbcaae +size 8740347 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..92d5179b110ca18d617642f4a0076bf68e72621d --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43808f175b319fc2d9bdc7c9f18b0efe3584621bbfc0e690b958f2a10c187491 +size 7704969 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..96f1eb6854ceb24373d1765ce2b0ce077d64aacf --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f696ba3501a2871e37a9dab0d49b1162d94b9863ca904ebf0697699921855e2 +size 13306769 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b138cab2ad1b460f3ed159db08196cbf2b03ffe5 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc78b754d38301c9495e633a5499b44bd80876e54a68b9a495a8e2c6642db7c4 +size 18861520 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5670483c67478eb676310cc632d02ae2a4aa9844 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:074204321fcc0c272f06452c35b2f55633f5afd2bcd89aa6de3c705378929328 +size 24239623 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c8fd5cd970baa74fde1463806ba7da18f30063fc --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e144b1531b6523c24b219800f2f55ae6927b26ecb495516f125f11c1b7354583 +size 29432473 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fda5d99ea1ad2bc063459c88f6d27488fc5800f0 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2150a7f47da2071041b3c0d25d8e265c1e0121fbeeac9c8bbe54e14ff168911b +size 34792612 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c62bfcc071e13bd5c4c0038950313df9f95b0b40 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9516338670e087d9c6702c7b714e65ad293234af1f959f3a78583b61e38037cb +size 4365398 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e55d89c3be95a7defad264445e2bf674361e3ceb --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9267aedac0ed8aeb4d1b811bedbfff708bffddc2563d9f0a507a72389c0b2d79 +size 5043673 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4a3566092e1f102d8b810150739f8f2c4527cbba --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08d72193df4003781761593b1483d354f645df6f3d4e81384a4cf0b1e37de4c6 +size 6137381 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a5174e139a3ed3f1acbadcf8c8c09d14d535d32b --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26194dec6a6546e53457244dac07588b7ba62b0f2a8fafe3f20159ca7098ce30 +size 7239405 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1c91820601cc70d39f0387d4b777443c6e0a642f --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c609162e37413eb86e352582265f9c623f82c02f6ca281b87b2b6567b0f57226 +size 8334937 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..15126edcf8d846ac3562130d9184e717c789d9ca --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0441cdcb4284e27c1ce3295cdaecbfb9d7ca5d7cf11220072ae2cc9fa07908ed +size 9435400 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_0.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..112201e20db119cd49dd3c6ba434a1c63c7a0fb9 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa1ddcd4db8bde6c277abd61aa8e3c1287a1e35fa15a1cf0d6e7789ed67b353 +size 2782096 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_1.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d9053ff0b6f9d81403ee67aee10981d3a3f56d47 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f4e6b88a7d72ff92f0fe408ce892606c980a0c1a71761b04da2f00e7254a840 +size 5103928 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_2.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d0c0d76d6bccd187a98fd529a78c02e4aeed1b99 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e96415082697bd67d0a5416df56e8003e2dee83f6bf3e6e45f92d76b4c7ba472 +size 7378509 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_3.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4155740db44c0b35c676e8faaa39d1c201335ab5 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd45c1b6f1134c19b4a786790db22ce43fdb999cf6b0d7be8637c163dadf69ca +size 9645995 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_4.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b2e86548fc497936ae72aef4635f4af6014a97a2 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df4fe4723179afa4ef6aa0abbd54b6dc508752c2dcb9059d831a172d767b1daf +size 11671727 diff --git a/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_5.jsonl b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1196f29ca504467da485a2b4f62014a54d44381e --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/examples.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b92a20a08fe6eb186f75ffb584b1a4200820fc802505fbc9fd3b3e7647f1a34e +size 13897507 diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f75197ee148ca87446d7f59e97d384cdcb4d769f --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.34441376096478077, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03364738239161352 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07156437671140904, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0016916866568706518 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.29498663582371476, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0047504849601230975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10791921496577737, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002171402381627088 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03339629860790558, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010276756756951227 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14089640762105182, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003169219645311096 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0506136487550108, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013544155568851314 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06867849616024986, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015588261952769657 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2865361097530141, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004609475551865619 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10397564759824128, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.002024130402320653 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06816360012566612, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001597766711115546 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2811330280761629, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004465952639791254 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10284733675284609, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020471999326618765 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..8eb53790df89201860eed5aca8dbeb6ad5f27697 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4687199126816133, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.036800374006492664 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07570221536151728, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014363865463457549 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.37281196342463774, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005425026995807581 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11753553291473576, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019140656759965315 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03517849994399333, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008874020071430252 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18207060381703669, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003664740082406787 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.054731274015692305, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011992442792975787 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07143954952407837, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001305238902060498 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35175875189308164, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0049642525171124975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11105152882900622, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017516497637055164 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07178061720744913, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013540467985344866 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.35171330673154494, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004937137016938597 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11134944889691471, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001795094595999485 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..37feea55fc061fd5b601018ee230c124e89238fa --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5235717824828133, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03767810577658163 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0783700606217331, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013622939044074152 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39995054593345924, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0052804057805626164 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12260704886786168, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018070929383927695 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03627187434475958, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008236125331839457 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19905166470669564, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038388111983134595 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05717657732704682, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001147470465886568 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07359908440403741, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001237832140736892 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37356398478304126, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004770085055809505 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11517678618925936, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016478650517612742 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07453785183849788, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012849507538737566 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3794084560485554, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0049017847382029295 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1165772048673089, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016980264714204242 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ab60cec36dbd26fc621b4e179b6a2094928e4a33 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5916343641542043, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04024225062945221 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07888158387802857, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013905334633539245 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4033319142330156, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005299089005220485 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12387093846990074, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001885726927501542 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0369653886039744, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008664032303747072 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20236135540846556, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038733010690355342 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.058284289461857604, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012101468635650288 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.073511276121497, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001251002353845416 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37511361165748164, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004789107031378535 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11544325899200131, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016990426527488723 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07497143356596919, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013133945848135208 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3819932847239564, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004902385390105475 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11762103770674365, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017726486791392565 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b5ac7f6978734af473b7eefb6f009accbca82e7f --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.584148826341706, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.032088259094079065 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07737100502750222, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013014310515114744 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4039418841652104, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00530796073731901 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12197092014603778, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017607850151334767 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.035917415755917156, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008009838171179654 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20296997665907882, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038561197119444304 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05693950723216792, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011236415767176787 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07227090942349099, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001170080155549711 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37605665528150317, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004782196417125406 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11390315132939448, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015842511141082533 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07366718744107867, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001228472532147223 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3838102958885374, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004940246508662335 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11605708607515382, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001657698456603933 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..beb8c4b2a9f4dc772d8672b71e25b9e9b20ae06f --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.643769416521065, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04327961614658416 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0778714729225077, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012716812804740509 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4199879645762265, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00535881210434279 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12362474434882809, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017387117939925156 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.036051220083070316, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000777501535408198 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21150748306290545, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0039302718094465635 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05758469671440457, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011051399672881632 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0719478472042638, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011295516496439356 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.38653994641960504, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004712427125192832 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11417482723461402, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015386798608318928 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0737393959127114, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001196371537872998 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.39623787521806264, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004912468268398718 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1169653954794077, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016283607844766808 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..56ad3449895d0a7c7700c53a0c6213564618b406 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1537922187888957, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018933213102104863 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2625407961087503, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002682894905994936 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1799962602325878, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00184248350208152 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.030157104540943284, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007476727834062231 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.055001050533522555, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014448444524840297 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03586670200965267, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008450513639399489 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11780986849918428, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013162517308047393 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.20916963040579825, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002196518290796577 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13967379634609953, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013162078681435803 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14081205310262065, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017218252583982084 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2419875104700217, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002500846878935716 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16507864218420232, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016765101940476469 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5029930497312527, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.050686861917854 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6923ba514b8eab455c5f1bb6391f9ebadce756da --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.18419539466594548, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00216315844926582 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.30850131448570595, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002881646502827461 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.21295884672876816, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001991739006687224 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.044713693466448406, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000968138913860097 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07839796746781187, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017417848523259565 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.051942458861991954, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010199515581882507 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1326981808478002, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014579507711624912 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23011492408104228, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00229754097749749 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15484936057383927, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001347730246639345 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.17205251851388254, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020202953529773735 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.28974852616388547, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002737913509276009 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1992303563413742, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018619630110637574 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.7242641167777077, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07938213037481555 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ea281c7ac59cdd7f89f3562afcc2cb4c30985ffd --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1997095751146021, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002703732640041402 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2883485784255837, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002841589718801568 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.20703905721090818, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001929567362026057 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.052135221349108814, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0014902691345396325 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07402543775497225, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001656124634067446 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.051520411225961356, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001031129051354628 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1503544839184264, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002191707211555614 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21866995964876715, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022872119612051362 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15441401199805835, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013920098120515118 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18828746764086687, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002574176036533358 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.27233360792883826, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027083132609021184 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1949510570568441, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001804660306034504 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.86942295772908, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08758910211106738 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e97ce7159eff002d0c8e30df4d2c737bc7e27765 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19702312634415606, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0035795334816332027 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.22825422304548265, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003232347523636064 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17391868610816388, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002277407569748311 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05667983844146617, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002120538883847141 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.059228247136442105, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015413764801780459 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04463749924381735, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010686000964725524 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.15076982480282128, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0030098254531581766 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.17209850822866807, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0025209050965990243 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12950729491278481, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00167294588483517 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1860026881384513, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003405588840643614 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.21613806050396925, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0030779584306118175 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1642422006919473, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002147002697595944 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.0330716712469843, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09425863264675978 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..72ca160618ea341e522cd92f369ecc2d497b3947 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.06862907083042237, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0029137045746235116 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07213602119470613, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002675324630242608 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.05441509889844838, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001922155872957772 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.019800771477798358, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0014215056199837948 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.019407609285097115, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011737580125973422 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.014130696002074776, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007469700039793996 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.054030861033230786, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002428473990666629 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.055369844370012286, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020897273452589395 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04132917986525425, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001453754043869357 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.06581471030428865, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0028148588567455577 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.06855419478068313, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002540543323104449 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.051839091609912694, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00182789753930337 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.4039582112595248, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03484552558450677 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..79b47e6da2a655543888ea734032ceb7e8c15cc9 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.010184074003326236, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001185280919251267 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.010530222683810939, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0010849872451804167 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.008187248278912505, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008215139146136158 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.003045190089865129, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000629256262446744 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0025316582919952747, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00035954782149502667 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0020440057618351945, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0002894852867481284 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.00801661098513702, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0009926654487693505 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.007789272405875561, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0008037973390293996 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006141492653296614, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.000619473069682991 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.009784563527498156, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011539456656877766 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.009966706597956685, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.001029454113884746 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.007792108172262034, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007861479859061975 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.0014137810446263e-08, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 5.022609361040328e-08 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d051410e8c2fe916fb97ee5dd85b84c5405c20d3 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.1668198320527802, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.01897983257333898 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.030286876271392194, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.001036156882791465 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.027143500611213456, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0007465539304065285 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.022506347386715704, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0005868062207608241 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.0011223500556642703, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0002013011694364979 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.0015238484363635906, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00022622383493949605 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.0010842906651617643, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0001636612072099844 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.029891451434790904, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0010048119314992631 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.027040559559811043, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0007436210949765598 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.022348380076958108, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0005776004107689916 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.02960870450534663, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0010175867142908736 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.025998503793795025, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0006867190478188373 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.02171066987180087, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0005513649905399339 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f071bd1d3ff282444a20e216f9b1db45033a701c --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.497789088857585, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1207333221383202 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5193372726053079, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032827860366154518 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4187417243003722, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029601462557396806 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.437040451945744, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002333774145212166 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.24404637097851045, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025862116613527076 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1933021952228981, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002111531045223336 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.20198550157867662, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019395848816704526 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3793149671052253, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028788724723207175 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.303084323993645, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023997981815417927 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.31702593617702457, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020123220115816466 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.424766622860286, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031065633020390844 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.34158689328494163, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027234093565780253 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3567272344346471, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002273204999670106 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ea2d0bc9bac73ff48d2a397ac20c96c648f75122 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.232352061213327, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.18438572640282935 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5438295687735817, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032626249125624544 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4519156735724399, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028471232903033885 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.46686827804183195, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021857893913537927 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2677592832314449, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002678442807946661 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21857181845743923, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021530696594196743 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22608889723213235, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001981518091728108 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3988680585181114, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029405304248634437 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3293160518559301, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002411675944122487 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34083378350431404, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020309168195614307 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.44900069330118875, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031269512646810997 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3728742942560764, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002675120241181924 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38531835059376945, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022236074600925494 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..00420e851d5c06d2f095d1acc299bdbc9e6d97e1 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.1599321841023, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1879116618302546 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5316343436240858, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032625643740183926 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4648983433320942, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002828266123213244 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4695262322349431, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00215490562453037 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.26457242284963084, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026154624845308966 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2286713763984792, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002213558974457314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23062310394414082, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019690665088102194 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3891085104737073, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029515533104354013 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3385179926519356, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002447035400467983 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3421096115443624, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020310235455138293 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.44153945634327574, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003131733329038247 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3859861563616844, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027050660850819557 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3897046712016254, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022104074028312126 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..4472709b522f1a9b86d6b7726f50fabfb8889426 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.215875217167579, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.19854834212398645 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5190910100984744, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003294663292154946 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.47129632991643877, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002752331164331658 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.46760558865318314, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021274829390602406 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2607371623810947, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026626721914091273 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23271303570323362, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002186914450625737 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23112566064185652, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001973386702544114 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.37743317581253305, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002922501161012456 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3421754841859648, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002448897823883138 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.33922485306684963, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020379531080847698 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.43332497676504134, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031201843719093183 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39450016226821116, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002683555554853958 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39088870724203995, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022061435555151025 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..700f7f138683f3d10d4a1539e1ecf753c5e91d72 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.675372357471726, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1772679235890945 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5079146856634101, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003244631875951903 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4750602535272041, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002707456752563758 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4652741436608286, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020856290234426084 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2506185278912072, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025688729450509744 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23020274907523836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021319283224229416 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22596116871891767, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019272220902171223 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3646830222320307, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002836137970051408 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.34124704138322626, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002433024945476074 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3336418614264682, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020082018536239574 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.42108375995240394, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003034856921594324 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3952453063898795, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026571910552197976 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38639018088252236, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021588490021418913 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..00d70f6a8814625b93abfbe216f11bc149e2bbfb --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.17780010896090837, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0028657687702784394 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.33168127958194993, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0043909919411222464 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2181226869116415, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0027581474749694035 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03931279207892139, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0016581578355807393 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07619599508022841, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00272241500352495 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.048528921002958546, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0017764487817816764 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.13228242420416667, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0023035178337467654 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24740150573619668, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003505699991405706 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16205491808395142, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002184657948901955 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.13792549177526942, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002344912834751097 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26116272332322926, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0038687142611478474 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16995115866612748, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0023209836007670715 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9965727451782298, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.15826205801047227 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..bd62ce84ccb1ce5e8da99e032308f99aaf9543c8 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12623297679712753, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.00185031477682142 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.31355314687479174, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004381874835308543 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17785826511919287, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002506168575309281 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02671739102876372, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010147304084239857 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06963018507899452, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002768236684178756 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03812763380493433, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014499362846337098 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0989142119051423, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013791496324926688 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24757016935280626, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034520987132384117 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13961978647843165, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018876284466631298 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10042944590263467, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015100489954681905 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2518445443289288, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003780328500383181 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1418358500050043, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020742150121420516 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.521961099148944, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1067162997839333 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c901a30f5c0ffcf1dc3d3904da280856625950f9 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12776888363608563, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018271531287357235 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.31621003695806416, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004292592593741099 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17992305299553213, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002471474032703446 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02713599956564803, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010066515368428789 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07048237066918879, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027207468576705084 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.038746331277995295, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001439750042341812 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10123566070632635, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013895764877661831 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2528390510389675, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003483747346972295 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14290468633219328, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019087949950632504 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10104760152172992, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014792769919128913 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2530463368650048, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037161332717751 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14276376154853065, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002040901548342001 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5280857149419538, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07885108475340596 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f88cc551637701be8b8d9529a926c5f3bd39b24c --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12121822408668065, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0020739133661264075 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.287891057927081, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004579134322254905 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.16685520709327625, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002665570155443094 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.024946562796427662, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010295220175533656 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.062229435333035196, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027102677143777706 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03502142308268661, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001453833565879767 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09584883568666924, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0016019599062301714 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.22935087983395927, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003723896150091747 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13219464959176125, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002089625494358884 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09677327103730465, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016860407775182488 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23249987999606497, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003931934403157173 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13360679199458778, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0022032590659256113 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.521537278708307, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1340390241992026 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..7c9d56b627027a92dc05d1b63b565dccee9ddcb7 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.038078096723767996, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0023781047408131164 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07110840872162687, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0041655460986093325 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04534730746066439, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002611229049263828 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00755130939213845, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009407309816817791 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.01456763376419491, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0015059193465168199 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.009137318621937963, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009714552620996167 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.030895255217096195, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.002026498228282476 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.05673417944538178, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033250538537188097 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.036178777224856525, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020901567682781942 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.03193887181863606, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002103908155038245 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.05872079534060702, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034877968907706214 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03747044675977351, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002195978615372179 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.629879023989858, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.12544962320083983 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..54f4d78bb05f28bd5be2385da510f8d59461a6ab --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/generation/slim.4b284b84bc4v2seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0028153785061314713, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0008109014775672004 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0022397022323243287, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0005923742999126791 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0024480546534426002, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0006663143862102796 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00032960010762452495, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0001942158416689748 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00021523288032721994, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00011457292554383501 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00025593065551168283, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00014085048380669117 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0021686356526300445, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0006433045803199352 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.00171133818409571, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0004578910681243736 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0018728301034077845, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0005184193716142723 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0024191989997527706, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0007056629627390068 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0019291072387565224, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0005158196897264791 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0021046719353290323, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0005793875805849997 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 8.029951400668467e-38, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 8.999389473215882e-33 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4v2seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_0.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b32521d8f01d8f7c607d2551e27e155422831017 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.323, + "acc_stderr": 0.01479492784334864 + }, + "anli_r2": { + "acc": 0.35, + "acc_stderr": 0.015090650341444233 + }, + "anli_r3": { + "acc": 0.3441666666666667, + "acc_stderr": 0.013720551062295755 + }, + "cb": { + "acc": 0.3392857142857143, + "acc_stderr": 0.06384226561930825, + "f1": 0.26343091936312274 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542127 + }, + "hellaswag": { + "acc": 0.475502887870942, + "acc_stderr": 0.004983788992681198, + "acc_norm": 0.6266679944234216, + "acc_norm_stderr": 0.004827006520802888 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.02985524739031495 + }, + "winogrande": { + "acc": 0.5761641673243884, + "acc_stderr": 0.013888492389944508 + }, + "storycloze_2016": { + "acc": 0.7156600748262961, + "acc_stderr": 0.01043161412866525 + }, + "boolq": { + "acc": 0.5886850152905199, + "acc_stderr": 0.008606395426309208 + }, + "arc_easy": { + "acc": 0.5989057239057239, + "acc_stderr": 0.01005705110653437, + "acc_norm": 0.5425084175084175, + "acc_norm_stderr": 0.010222638127749496 + }, + "arc_challenge": { + "acc": 0.2790102389078498, + "acc_stderr": 0.013106784883601336, + "acc_norm": 0.3046075085324232, + "acc_norm_stderr": 0.01344952210993249 + }, + "sciq": { + "acc": 0.849, + "acc_stderr": 0.011328165223341671, + "acc_norm": 0.757, + "acc_norm_stderr": 0.013569640199177451 + }, + "piqa": { + "acc": 0.7551686615886833, + "acc_stderr": 0.010032309105568793, + "acc_norm": 0.763873775843308, + "acc_norm_stderr": 0.009908965890558216 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_0_lm-eval_global_step80108_2023-02-24-15-37-25_0shots_backup.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_0_lm-eval_global_step80108_2023-02-24-15-37-25_0shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..b32521d8f01d8f7c607d2551e27e155422831017 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_0_lm-eval_global_step80108_2023-02-24-15-37-25_0shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.323, + "acc_stderr": 0.01479492784334864 + }, + "anli_r2": { + "acc": 0.35, + "acc_stderr": 0.015090650341444233 + }, + "anli_r3": { + "acc": 0.3441666666666667, + "acc_stderr": 0.013720551062295755 + }, + "cb": { + "acc": 0.3392857142857143, + "acc_stderr": 0.06384226561930825, + "f1": 0.26343091936312274 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542127 + }, + "hellaswag": { + "acc": 0.475502887870942, + "acc_stderr": 0.004983788992681198, + "acc_norm": 0.6266679944234216, + "acc_norm_stderr": 0.004827006520802888 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.02985524739031495 + }, + "winogrande": { + "acc": 0.5761641673243884, + "acc_stderr": 0.013888492389944508 + }, + "storycloze_2016": { + "acc": 0.7156600748262961, + "acc_stderr": 0.01043161412866525 + }, + "boolq": { + "acc": 0.5886850152905199, + "acc_stderr": 0.008606395426309208 + }, + "arc_easy": { + "acc": 0.5989057239057239, + "acc_stderr": 0.01005705110653437, + "acc_norm": 0.5425084175084175, + "acc_norm_stderr": 0.010222638127749496 + }, + "arc_challenge": { + "acc": 0.2790102389078498, + "acc_stderr": 0.013106784883601336, + "acc_norm": 0.3046075085324232, + "acc_norm_stderr": 0.01344952210993249 + }, + "sciq": { + "acc": 0.849, + "acc_stderr": 0.011328165223341671, + "acc_norm": 0.757, + "acc_norm_stderr": 0.013569640199177451 + }, + "piqa": { + "acc": 0.7551686615886833, + "acc_stderr": 0.010032309105568793, + "acc_norm": 0.763873775843308, + "acc_norm_stderr": 0.009908965890558216 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_1.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_1.json new file mode 100644 index 0000000000000000000000000000000000000000..add8df2245b74afd79809099e62b7286cf26af96 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087966 + }, + "anli_r2": { + "acc": 0.319, + "acc_stderr": 0.014746404865473477 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291852 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.3282195387458545 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.47321250746863175, + "acc_stderr": 0.004982615233057104, + "acc_norm": 0.6222863971320454, + "acc_norm_stderr": 0.004838246410786253 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808946 + }, + "winogrande": { + "acc": 0.5706393054459353, + "acc_stderr": 0.013911537499969179 + }, + "storycloze_2016": { + "acc": 0.7049706039551042, + "acc_stderr": 0.010546232606962287 + }, + "boolq": { + "acc": 0.5957186544342508, + "acc_stderr": 0.008583313811372076 + }, + "arc_easy": { + "acc": 0.617003367003367, + "acc_stderr": 0.009974920384536469, + "acc_norm": 0.5744949494949495, + "acc_norm_stderr": 0.010145271182591026 + }, + "arc_challenge": { + "acc": 0.29436860068259385, + "acc_stderr": 0.013318528460539426, + "acc_norm": 0.32337883959044367, + "acc_norm_stderr": 0.013669421630012132 + }, + "sciq": { + "acc": 0.884, + "acc_stderr": 0.010131468138756995, + "acc_norm": 0.859, + "acc_norm_stderr": 0.011010914595992443 + }, + "piqa": { + "acc": 0.7540805223068553, + "acc_stderr": 0.010047331865625191, + "acc_norm": 0.7584330794341676, + "acc_norm_stderr": 0.009986718001804454 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_1_lm-eval_global_step80108_2023-02-24-15-37-25_1shots_backup.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_1_lm-eval_global_step80108_2023-02-24-15-37-25_1shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..add8df2245b74afd79809099e62b7286cf26af96 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_1_lm-eval_global_step80108_2023-02-24-15-37-25_1shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.014683991951087966 + }, + "anli_r2": { + "acc": 0.319, + "acc_stderr": 0.014746404865473477 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291852 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.3282195387458545 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.47321250746863175, + "acc_stderr": 0.004982615233057104, + "acc_norm": 0.6222863971320454, + "acc_norm_stderr": 0.004838246410786253 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808946 + }, + "winogrande": { + "acc": 0.5706393054459353, + "acc_stderr": 0.013911537499969179 + }, + "storycloze_2016": { + "acc": 0.7049706039551042, + "acc_stderr": 0.010546232606962287 + }, + "boolq": { + "acc": 0.5957186544342508, + "acc_stderr": 0.008583313811372076 + }, + "arc_easy": { + "acc": 0.617003367003367, + "acc_stderr": 0.009974920384536469, + "acc_norm": 0.5744949494949495, + "acc_norm_stderr": 0.010145271182591026 + }, + "arc_challenge": { + "acc": 0.29436860068259385, + "acc_stderr": 0.013318528460539426, + "acc_norm": 0.32337883959044367, + "acc_norm_stderr": 0.013669421630012132 + }, + "sciq": { + "acc": 0.884, + "acc_stderr": 0.010131468138756995, + "acc_norm": 0.859, + "acc_norm_stderr": 0.011010914595992443 + }, + "piqa": { + "acc": 0.7540805223068553, + "acc_stderr": 0.010047331865625191, + "acc_norm": 0.7584330794341676, + "acc_norm_stderr": 0.009986718001804454 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_2.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8e961a9c331db0036f933002c7fc889aaa180731 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.326, + "acc_stderr": 0.014830507204541056 + }, + "anli_r2": { + "acc": 0.321, + "acc_stderr": 0.014770821817934644 + }, + "anli_r3": { + "acc": 0.3308333333333333, + "acc_stderr": 0.013588208070708997 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.2692307692307692 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4715196176060546, + "acc_stderr": 0.004981680090303695, + "acc_norm": 0.6208922525393348, + "acc_norm_stderr": 0.004841734453506668 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.574585635359116, + "acc_stderr": 0.013895257666646382 + }, + "storycloze_2016": { + "acc": 0.7183324425440941, + "acc_stderr": 0.010401844358587665 + }, + "boolq": { + "acc": 0.6039755351681957, + "acc_stderr": 0.008553881336813413 + }, + "arc_easy": { + "acc": 0.6191077441077442, + "acc_stderr": 0.009964428212260372, + "acc_norm": 0.5921717171717171, + "acc_norm_stderr": 0.010083950240041223 + }, + "arc_challenge": { + "acc": 0.302901023890785, + "acc_stderr": 0.013428241573185349, + "acc_norm": 0.3174061433447099, + "acc_norm_stderr": 0.01360223908803817 + }, + "sciq": { + "acc": 0.899, + "acc_stderr": 0.009533618929340997, + "acc_norm": 0.877, + "acc_norm_stderr": 0.010391293421849877 + }, + "piqa": { + "acc": 0.7524483133841132, + "acc_stderr": 0.010069703966857104, + "acc_norm": 0.7633297062023939, + "acc_norm_stderr": 0.009916841655042809 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_2_lm-eval_global_step80108_2023-02-24-15-37-26_2shots_backup.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_2_lm-eval_global_step80108_2023-02-24-15-37-26_2shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..8e961a9c331db0036f933002c7fc889aaa180731 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_2_lm-eval_global_step80108_2023-02-24-15-37-26_2shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.326, + "acc_stderr": 0.014830507204541056 + }, + "anli_r2": { + "acc": 0.321, + "acc_stderr": 0.014770821817934644 + }, + "anli_r3": { + "acc": 0.3308333333333333, + "acc_stderr": 0.013588208070708997 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.2692307692307692 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4715196176060546, + "acc_stderr": 0.004981680090303695, + "acc_norm": 0.6208922525393348, + "acc_norm_stderr": 0.004841734453506668 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.574585635359116, + "acc_stderr": 0.013895257666646382 + }, + "storycloze_2016": { + "acc": 0.7183324425440941, + "acc_stderr": 0.010401844358587665 + }, + "boolq": { + "acc": 0.6039755351681957, + "acc_stderr": 0.008553881336813413 + }, + "arc_easy": { + "acc": 0.6191077441077442, + "acc_stderr": 0.009964428212260372, + "acc_norm": 0.5921717171717171, + "acc_norm_stderr": 0.010083950240041223 + }, + "arc_challenge": { + "acc": 0.302901023890785, + "acc_stderr": 0.013428241573185349, + "acc_norm": 0.3174061433447099, + "acc_norm_stderr": 0.01360223908803817 + }, + "sciq": { + "acc": 0.899, + "acc_stderr": 0.009533618929340997, + "acc_norm": 0.877, + "acc_norm_stderr": 0.010391293421849877 + }, + "piqa": { + "acc": 0.7524483133841132, + "acc_stderr": 0.010069703966857104, + "acc_norm": 0.7633297062023939, + "acc_norm_stderr": 0.009916841655042809 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_3.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_3.json new file mode 100644 index 0000000000000000000000000000000000000000..21b41f0b389920760579eb067c5abd57e9f956bd --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.306, + "acc_stderr": 0.014580006055436967 + }, + "anli_r2": { + "acc": 0.361, + "acc_stderr": 0.015195720118175122 + }, + "anli_r3": { + "acc": 0.31583333333333335, + "acc_stderr": 0.01342456883035645 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.06460957383809221, + "f1": 0.2902724515627741 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.4742083250348536, + "acc_stderr": 0.0049831384796043795, + "acc_norm": 0.6274646484763992, + "acc_norm_stderr": 0.004824917516374194 + }, + "rte": { + "acc": 0.5667870036101083, + "acc_stderr": 0.029826764082138277 + }, + "winogrande": { + "acc": 0.580110497237569, + "acc_stderr": 0.013870943986310391 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.6042813455657492, + "acc_stderr": 0.008552742471459792 + }, + "arc_easy": { + "acc": 0.622895622895623, + "acc_stderr": 0.009945041946366515, + "acc_norm": 0.6035353535353535, + "acc_norm_stderr": 0.01003741276306453 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.01340674176784762, + "acc_norm": 0.3250853242320819, + "acc_norm_stderr": 0.013688147309729122 + }, + "sciq": { + "acc": 0.897, + "acc_stderr": 0.009616833339695798, + "acc_norm": 0.882, + "acc_norm_stderr": 0.010206869264381791 + }, + "piqa": { + "acc": 0.7573449401523396, + "acc_stderr": 0.0100020025697087, + "acc_norm": 0.764417845484222, + "acc_norm_stderr": 0.009901067586473893 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_3_lm-eval_global_step80108_2023-02-24-15-37-26_3shots_backup.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_3_lm-eval_global_step80108_2023-02-24-15-37-26_3shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..21b41f0b389920760579eb067c5abd57e9f956bd --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_3_lm-eval_global_step80108_2023-02-24-15-37-26_3shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.306, + "acc_stderr": 0.014580006055436967 + }, + "anli_r2": { + "acc": 0.361, + "acc_stderr": 0.015195720118175122 + }, + "anli_r3": { + "acc": 0.31583333333333335, + "acc_stderr": 0.01342456883035645 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.06460957383809221, + "f1": 0.2902724515627741 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.4742083250348536, + "acc_stderr": 0.0049831384796043795, + "acc_norm": 0.6274646484763992, + "acc_norm_stderr": 0.004824917516374194 + }, + "rte": { + "acc": 0.5667870036101083, + "acc_stderr": 0.029826764082138277 + }, + "winogrande": { + "acc": 0.580110497237569, + "acc_stderr": 0.013870943986310391 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.6042813455657492, + "acc_stderr": 0.008552742471459792 + }, + "arc_easy": { + "acc": 0.622895622895623, + "acc_stderr": 0.009945041946366515, + "acc_norm": 0.6035353535353535, + "acc_norm_stderr": 0.01003741276306453 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.01340674176784762, + "acc_norm": 0.3250853242320819, + "acc_norm_stderr": 0.013688147309729122 + }, + "sciq": { + "acc": 0.897, + "acc_stderr": 0.009616833339695798, + "acc_norm": 0.882, + "acc_norm_stderr": 0.010206869264381791 + }, + "piqa": { + "acc": 0.7573449401523396, + "acc_stderr": 0.0100020025697087, + "acc_norm": 0.764417845484222, + "acc_norm_stderr": 0.009901067586473893 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_4.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1dfa15c148c4961db73d79b0191b5560e91df659 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.347, + "acc_stderr": 0.015060472031706622 + }, + "anli_r2": { + "acc": 0.361, + "acc_stderr": 0.015195720118175127 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.013680495725767787 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.266719222178426 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.47400916152160927, + "acc_stderr": 0.004983035420235718, + "acc_norm": 0.6275642302330213, + "acc_norm_stderr": 0.004824655406075563 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.584846093133386, + "acc_stderr": 0.013848684086658585 + }, + "storycloze_2016": { + "acc": 0.7247461250668092, + "acc_stderr": 0.010328538400500567 + }, + "boolq": { + "acc": 0.5984709480122324, + "acc_stderr": 0.008573784490094754 + }, + "arc_easy": { + "acc": 0.6283670033670034, + "acc_stderr": 0.009915897123658788, + "acc_norm": 0.5972222222222222, + "acc_norm_stderr": 0.010063960494989163 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.01340674176784762, + "acc_norm": 0.3370307167235495, + "acc_norm_stderr": 0.013813476652902269 + }, + "sciq": { + "acc": 0.911, + "acc_stderr": 0.009008893392651518, + "acc_norm": 0.898, + "acc_norm_stderr": 0.009575368801653892 + }, + "piqa": { + "acc": 0.7546245919477693, + "acc_stderr": 0.010039831320422396, + "acc_norm": 0.766050054406964, + "acc_norm_stderr": 0.009877236895137446 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_4_lm-eval_global_step80108_2023-02-24-15-37-26_4shots_backup.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_4_lm-eval_global_step80108_2023-02-24-15-37-26_4shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..1dfa15c148c4961db73d79b0191b5560e91df659 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_4_lm-eval_global_step80108_2023-02-24-15-37-26_4shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.347, + "acc_stderr": 0.015060472031706622 + }, + "anli_r2": { + "acc": 0.361, + "acc_stderr": 0.015195720118175127 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.013680495725767787 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.266719222178426 + }, + "copa": { + "acc": 0.82, + "acc_stderr": 0.038612291966536955 + }, + "hellaswag": { + "acc": 0.47400916152160927, + "acc_stderr": 0.004983035420235718, + "acc_norm": 0.6275642302330213, + "acc_norm_stderr": 0.004824655406075563 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.584846093133386, + "acc_stderr": 0.013848684086658585 + }, + "storycloze_2016": { + "acc": 0.7247461250668092, + "acc_stderr": 0.010328538400500567 + }, + "boolq": { + "acc": 0.5984709480122324, + "acc_stderr": 0.008573784490094754 + }, + "arc_easy": { + "acc": 0.6283670033670034, + "acc_stderr": 0.009915897123658788, + "acc_norm": 0.5972222222222222, + "acc_norm_stderr": 0.010063960494989163 + }, + "arc_challenge": { + "acc": 0.30119453924914674, + "acc_stderr": 0.01340674176784762, + "acc_norm": 0.3370307167235495, + "acc_norm_stderr": 0.013813476652902269 + }, + "sciq": { + "acc": 0.911, + "acc_stderr": 0.009008893392651518, + "acc_norm": 0.898, + "acc_norm_stderr": 0.009575368801653892 + }, + "piqa": { + "acc": 0.7546245919477693, + "acc_stderr": 0.010039831320422396, + "acc_norm": 0.766050054406964, + "acc_norm_stderr": 0.009877236895137446 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_5.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c19fa92879d665ed88cd89445cedfd9cbf1faa77 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.334, + "acc_stderr": 0.014922019523732977 + }, + "anli_r2": { + "acc": 0.351, + "acc_stderr": 0.015100563798316407 + }, + "anli_r3": { + "acc": 0.32083333333333336, + "acc_stderr": 0.013480882752851543 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.2943692088382039 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.472814180442143, + "acc_stderr": 0.004982400368939667, + "acc_norm": 0.6304521011750648, + "acc_norm_stderr": 0.00481695881772609 + }, + "rte": { + "acc": 0.5415162454873647, + "acc_stderr": 0.029992535385373314 + }, + "winogrande": { + "acc": 0.5911602209944752, + "acc_stderr": 0.0138169542951357 + }, + "storycloze_2016": { + "acc": 0.7188669160876536, + "acc_stderr": 0.0103958360916281 + }, + "boolq": { + "acc": 0.6073394495412844, + "acc_stderr": 0.008541161248702913 + }, + "arc_easy": { + "acc": 0.6258417508417509, + "acc_stderr": 0.009929516948977627, + "acc_norm": 0.6022727272727273, + "acc_norm_stderr": 0.010042861602178058 + }, + "arc_challenge": { + "acc": 0.3003412969283277, + "acc_stderr": 0.013395909309956995, + "acc_norm": 0.3225255972696246, + "acc_norm_stderr": 0.013659980894277373 + }, + "sciq": { + "acc": 0.914, + "acc_stderr": 0.008870325962594766, + "acc_norm": 0.901, + "acc_norm_stderr": 0.009449248027662734 + }, + "piqa": { + "acc": 0.7513601741022851, + "acc_stderr": 0.010084511234296852, + "acc_norm": 0.7687704026115343, + "acc_norm_stderr": 0.009837063180625336 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_5_lm-eval_global_step80108_2023-02-24-15-37-25_5shots_backup.json b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_5_lm-eval_global_step80108_2023-02-24-15-37-25_5shots_backup.json new file mode 100644 index 0000000000000000000000000000000000000000..c19fa92879d665ed88cd89445cedfd9cbf1faa77 --- /dev/null +++ b/4b284b84bc4v2seed4/evaluation/rankeval/4b284b84bc4v2seed4_5_lm-eval_global_step80108_2023-02-24-15-37-25_5shots_backup.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.334, + "acc_stderr": 0.014922019523732977 + }, + "anli_r2": { + "acc": 0.351, + "acc_stderr": 0.015100563798316407 + }, + "anli_r3": { + "acc": 0.32083333333333336, + "acc_stderr": 0.013480882752851543 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.2943692088382039 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.472814180442143, + "acc_stderr": 0.004982400368939667, + "acc_norm": 0.6304521011750648, + "acc_norm_stderr": 0.00481695881772609 + }, + "rte": { + "acc": 0.5415162454873647, + "acc_stderr": 0.029992535385373314 + }, + "winogrande": { + "acc": 0.5911602209944752, + "acc_stderr": 0.0138169542951357 + }, + "storycloze_2016": { + "acc": 0.7188669160876536, + "acc_stderr": 0.0103958360916281 + }, + "boolq": { + "acc": 0.6073394495412844, + "acc_stderr": 0.008541161248702913 + }, + "arc_easy": { + "acc": 0.6258417508417509, + "acc_stderr": 0.009929516948977627, + "acc_norm": 0.6022727272727273, + "acc_norm_stderr": 0.010042861602178058 + }, + "arc_challenge": { + "acc": 0.3003412969283277, + "acc_stderr": 0.013395909309956995, + "acc_norm": 0.3225255972696246, + "acc_norm_stderr": 0.013659980894277373 + }, + "sciq": { + "acc": 0.914, + "acc_stderr": 0.008870325962594766, + "acc_norm": 0.901, + "acc_norm_stderr": 0.009449248027662734 + }, + "piqa": { + "acc": 0.7513601741022851, + "acc_stderr": 0.010084511234296852, + "acc_norm": 0.7687704026115343, + "acc_norm_stderr": 0.009837063180625336 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0987e2debcec20d154edca9111711057cdee921 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3874db92128255c37abc9db653d69ff5e1bf626defb6ae16180c1ce5ec75ae26 +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65c261d072b82d73f5f592bb37b1ebe13b695b57 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afa316b54dc723de15ab0d113d27d0fed890c8b2ba1c2ccbb5ec406de1ce6f8c +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbe16bb357750e6a7923e5ac7e4a0716f4dbc0da --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b0e9a004589aa8cbc8dd5e3a61ce94f00702c480fad6277b8578c0357b93216 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb8aada65086355218ac45f4ae41957fc0870127 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543943b69d9853547c8e218cbf9cb1dafe597344a5908b313320f824cb280975 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9e31d6b0fa4da70eac54732e2fad1ecc501119d --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dda902b7fb4fdd8bcf94edfffc9d271d030099896f00e3bb3957502e49142c1 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49e14ab43e3db00763d7f08150e6e0438af36360 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3ef037fa7c943b76559a8c6d58d104ba459e18a8973bc41a0a45d39be24ab5b +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02e516ff287bc5fc299d163e06afa238089c682d --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:202ba1c2a825a816d04bcabb56f20a24f9ff9a6972130cc8ae7ae00d7fb13906 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b75ff0f0ab07277a17e623c6c7c8ffe07eb985af --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f6923fbe21a380151a003ffc373a804456cd4ca6013031681576202c4533ac +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b75504d1ffd8b056f870851adaa327fdc0aa8f6e --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c821fbb24d28f30b7afffca78b49090d39843667297e68a91de74b67c02c1726 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99f3d5ab046ef311570a1591d4f1734f5d1f4306 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8daeae3407f4585ccdb0a6ca0a9ca395fc605ad7c2c46708d58a2981d4c3abfc +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaa920b7c16bd458799a6415ce1ef6ee11f2efe0 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c93853e80c4644e319888bc58247f21a984d6176ff7192b67becb974e11b2df +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ab1f6a0dce83b9381adaf38b320a0c4e0e55d5f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b92dd24272ec564048b08b5f177078bb66a1da59a57c2cddcde4cefefc7e13b5 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dafc8f10fb227e5db5debcc01f8770e7492a2b5a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0366415d5ef90bd7000ecdf68356808d47de37d1135cb1ac45aca686ea84cffe +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3df2bc079d2e3ed2de47be0fc919fe50ea8489d0 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb7fcbe427a2e6d115d87e9987ff6bb4ab7f2063c0d8142e6c18ca5729635ba +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..780290c2c7d8e0174d848a7cd108f81ee8aab1dd --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaf53782e8dca72bdf6d50ca933d27573b3cdecd9c3d735975193f539aa1545f +size 199058669 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b1af3ec20317d8a7c4455c76efb77974f021727 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f7a527b2cc20e81327fb0fb221b80ce10d29f88d98a7628c623cfb9b818bd1a +size 199058669 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0a3a07c803b2366e05ed2093230fee6b2e61c39 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:767e53d430b403b9426eecc6b614191e8e426bf5b22389d4155add94e5839315 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a788ee4d0fa61aa7dd4eae743dd6364de86253ef --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc0c556935964ddb8010ffcb60b4977d800022013cf5523909120d0ecdcefa98 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff56607390162cb8bca387555b7f53c49e960813 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4b9f40bff2fd2a20c75aa74bbeeb2950dcb10f5c8a4466ac9c8018185d9f391 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c51a5f65925d51d8e0043c98e7cc9642ff722d37 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:679a2877e7c4b37d59069a4b247e1c4cb52a8c3423f5e34ad99d239b51953176 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6750c97f9fee919c49e0059bca76a708cd414aa3 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79f45c983012716dad638c92710679c965a209d6e529adf3829991ceaeadaae8 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35a351932cd618ac140835ed24c4d0badfef8ff8 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d1ea3540a44245a02db8d36aba9cf2db43a5ba932e7a514915d4e533b3cf75 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..298e6e35e3225ef6987f363e71c9f351ac95120b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eebdad0c02072a193ac381648dda87622639cf9511e13fee172e75ee0a24c84 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87f1f17b904d2804b12f6e0ef237bf718663d166 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd863b08e8c2b2928de1256eedcb2c4e3ac5eb166aabe60c0fcb904c1ebcfb99 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0513394fad3eabe8dcdb13c1aa9786c2ef65c4c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3facad4d357c962509ea3c29233626a215f318bb83951055f401db64c0aa52c8 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fae99c31dcac8a1d16cafa2b4ad1a7cafd64344 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd562de711bdad55db1b5c2a37afaea5466b1de6fb9c2656adc2caf3de3d29b +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eecc7d32a527458f72105a0b8dde2ed9ce06117f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3efb726faba42c509c16ffef057b2498094ef4fde49ccceca103e9076146b6 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f06bf66f7e6335111e91f1339c9037fd5f61a503 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:440fa04cc095301bc307828a065577a57f466c6aa4e963e1810037ff0e9a9689 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e03a674bc6dca1c58f63b692ffc0629f1170452b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01223eaf17e4635ee20ec6382363cc3c98393356777659689e01a926b7529719 +size 199058605 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7335688aceae08847cd72393fc4bf598f5aa0c6d --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0739b293050fcc0b2fd634f2cab75cd6486285fab14f4d8e0343192a4ea4a6 +size 199058605 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a831bb28fe2b061a07c83c3e05feced3e17f86b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:965fd7946678c493de7811099911b565f81ffb2d07f675857919071141b3f8fd +size 199058669 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13ea342f68a2e7d310ee2a478e49f9e142934755 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:829e8a61870478a87fa5e7f5332758292cfa5cda9cd9932b6c99d2b396c623ef +size 199058669 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5483bd8ceceade39a95aa02ed46c4ca67924505e --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f32196ad78ddb73595ef3f63f49a0635cde4bc849adf59fd363f85b7d23294b5 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5137804bce8a4bcba25b3518ef3f9ae4e4d39d3c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91f25e35702bc99caa1d12e5a256e3abfe6be0d9c46ba1d1f5473a0e03d1d571 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a52c020a6097e6e7a309b6e91fd62a67fa687a4 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c8f070007737e98e31dcb13dbbef5e7173c28ef1109151424ec6b055b45cc7 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b59c3f99a9d8b6d370c677f9df02332b78be2ed5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f578e99e42da3e5ff17d4046239dc77cfaa1c7735d085b272bdd22b59b6a33a4 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f033d74661e75462ca7fd06d59900ddc1c403898 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b44819143d2b3f51884d1afb039ffa934bcd45078d06a8035c51a7b6322121b +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab0ee24e60acaebc0ee54512fdb986091e048e83 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e76d50bf92f58f8358a32eb0a5aecf746eb51201521cd44083e470fa50b0933 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd8734566e1389236b0d9a198144852bacae2a45 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:800d62529b110632c0eec8dd4d2a68cdf27b3969f674c2bc1f3bc62a27dacf03 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a659264783c2d54f422133d1ad3d54bb2df1f00 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c040cbe628a8ff3347c64a4031121480855e344f1bd92ff21919fb764c5d7bd +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ea3dd6379f9c9503d6b37a3bdad8cd80302307 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7f745b2715509022f925145082e7aed962d2e7de6810e3241eec26c6b42666b +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..856ce4e076a005b72ae5c087139f2ac2b22ae759 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f44b98a7b0e0e0dfc235117034d499653aba5fbeeb60109c852be460593c4d5 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97cff98274acaa6a888b93013673ca64d79913a1 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b13b5b87e70e5b8809d1e57cf0b7821971990ad47717b3c5e7ee83a4807b361 +size 199058669 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5848956fe7ba44fc0cd7a30c07dd9a369a353eb --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce0423c05dabc95dbc9a0f5d92deaa44a1ee461329ee45115ecede7ad850ff29 +size 199058669 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..763701c0ea1ba327184679a3c1925aa92c30a185 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82dc5aceaa09aa913940b66259ffdbd99d954efcf65e66f04862e608e74a880d +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b16df6f57a77eb08292bf73e0eeae705ae9bf989 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce21c9e18ffc54ebe20688a8c674ce3c51493f01f3e7ea28b9ec13de8a41206e +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2310f7e8d7a0e2efaedf79a313cb915c45d569e4 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bb990628926eb6b22b5329ef16023d4624d34b27bf7546a52cb2229ce9dddb3 +size 199058669 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8819eb4f04017c49f7c638ca8c5ff44f84051b49 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14fb5349582ffb431d19e6f877395958380b69051db3e6d60d99ece5730b0933 +size 199058669 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c29fc0cc11f01d4838c448250ce4903bd793b48 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4d76364cdcc3dc633250b0abfe63a5a035834adef057569eae3bea65b88b8f6 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10bae58ee7440cb628cae6277d1629923c929d3c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dc1bff9319979fe94e8c3634917327da9a599ab6dcbe271585b82b13c2e22e0 +size 199058797 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a573926b9b706703357bbd4ba0a8a432591de10 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:589626de302154fa950ce5ac5a685f716cdd5bff9e8f29c0a0c24c7d923e65c0 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45d46943a9796166ff33d4483ef7a9082ab6b988 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d38bc71958d5c150b08010758459280b6e5b2f79631539580d8949fb5a71ed59 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15be25965fbb9ba0f47591bbe464c969e7474306 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1421825d1f6cc8d785a40393c023a4d443b50e6c4a0b51a813786585c4d6af85 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4da6daa210d43e3c9f5725027dbc351f19adc33c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea70483a297cc8e88a0b2bca5c90af94b7ba429d6aa795c7296a0b0c2f32297 +size 199058733 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b888f102e214d82d3b2a50592ae3f5e200d8318 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971c196636d665ede41278d3cbd417f664097fefbe864ac793fc1ca7590e4ac1 +size 199058669 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eae1e99b6148c7fd1e984ccc113fe924822ca154 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf979f305ac90caa2a45e310b64df87e721002e3462994286cb78ac46f4f39b8 +size 199058669 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f58b1eeb25271fc10a676738de743af5ee0b669 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b91df9e53768fe52e36eea7e086e83ffb9b8f39962fd3650374ae2eac5c6ef9 +size 199058925 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61b5886e9c013e0f26baba8da601ce44ea07d780 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:908b1ee2cd408bbb45d78b6275569aec7f884fe7b88f1c65487549bf1ee8a371 +size 199058925 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14a6512ad54ef2c1b462fc397618dfecaa4cb7f3 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0269751cd8b5c3702532d0e9ea829395fb2635ffed60432e4af0ce12930e2d96 +size 199058605 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88daa8090a48696b4d0b6df4a33d3209c3c71583 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76f819b629371828991de19dae99adcd9165d084e2c428b9f4bd3b9a9d15062a +size 199058605 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a5049ffefd43da61d26580a9ac0e575c3ddd758 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e152d26db15c1d4a99cf2061346949801ac40abf4dd1278f008b42b8da24dac0 +size 199058605 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aec7fd7abd53090d8c5ba7036945a45f5c62975 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e40e630fbeff015106109e25298f8bf6aa1c4ea313d2616485c690f683567bf3 +size 199058605 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7723336a4724cb3717fb2f31c78c3011bc21fe8c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:454aee3009b4c112d6884183f8abfed9339332fd3282f9c3c61256affcc343e0 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee5cf4fccb64dde11fa8b49b49ef3274e6dad98d --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5137b9bf9b38d0d4eb503e4455cd40ec93fd06295d2fd5713a6001a6ddd120 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6210e6d37d9ff4eb2200fbcd1d3f6ad016dc59ee --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c6b05f8693bd3f682f70c94a2a9b7e05e3d3d148593c9255c52fb84894a36d3 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d0393db392efe1b2755691ea60e7e481c8a09e2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:030756fe2d381cfee73560d86171337c77ecd5796514e34918d631d249709b3b +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6fbd3958ced2440b2204eec67190d4068d03cbf --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01559ccf30baa28e11a1d1a953bea05dcbd55736764112fa1395c288ff69600c +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4241339ab87774be93b93bcd83271c0b3134f183 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d03827c5bdc2335a74215d73fe55ebe9ccce07734216a9cd14b5235424db9538 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..233b08a07131d220715b6088213bdc212d92a763 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8da6b279a2c6f10145fce6d1fcbd1f60d50ae18134842a51ed86cd2d94fbcfb +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..743bb73a31834da39030d8ee75abb2cf5eca5fd1 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cafb8b4cb01dda647d899b37d787f57da121511d688a489e17781ae44a1c038 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9ea2d657b8dfabe2592822ccf3a0ed08c6bbee9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa4eb9eb8f58df359625645602d76104332951dd8d68e6c086c5d95e05e82a8 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2ce7e83d21ab2ce4c8494b979361bbd575c648b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:295822feff0a5a2f1b895da8e70ea44847f5d10ac834695fa7735ce00f02c079 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eaf955b8405b21855ac229b22f3f48a516bcbbe --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf014541b942f352aa1444bf95e2ef82eab6e4b0e3bc40a41057e087b91a4b6c +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20f81b695a441c5bad9e209e3e70dd1bc04d4ef3 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ad1dce2c184c85629e34a8b3fe045095254f2c128fc979423274f88969c811a +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9ac08007c2c61e4db54fc1230c2f05253baa699 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:915f1af9a0efa070797ca2e028d1bc9278d114ba5e712c592ef06a338ea73ea1 +size 199058978 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a867b1ad1bf41b04d460a64c4766be6260ffed58 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:749d8aff52de1b1645edb3f05b080932c38e07b7674283c6566336f76773c7ce +size 199058978 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adb360d80fd4c2996649a3d203d49ce5f79b586b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:721496d0f75587803e28ac1052fc2526ddf224c493ea814bd85e0bd3d45215a4 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8010a67a8516ef5a9bceabab8ff04864269aa63c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84455a6a434ec36372c351c44036ad13add21800f0c36d3a41756e302f3ba0f9 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..736e6401404ffbabe5ecd38f7b7571155c8ddfb6 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da5be1c46f8954dba3c1873d46159aaf0bd8cac70375b772961e47d6a8153d34 +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1363721449566ddee398c1931e526e825bca85b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55b93763f17338b5b23bc875d4da733f0894dc4a1f6c115bf0fcde23a58bb45 +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ae2893e67613b29923211efa711fff443b3dbb0 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ef317ff239119e98df480cff7ec15b8167fa46d16c2e1d0fb398f402002509 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..719b5c5be1f5687250956c5cd682a3a7ec5129aa --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2173296229ea27f1716408eda2f545a5ff6c7eb192f3b4dbdf6ecc4e10b68c73 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ee09a775b6c0ccb563f1e410bf780193ee54f85 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f314dd030cbac42c339b606a2a3ff7227ba4f5d566c88eb46b88daf0e103a1c +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..784e60a329d4cf31bcd6805aed3e8f957c0a8a80 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6b24cc50bc0cfb6db5698427cf13a3076a5f34b770e2914c8704e6da9c5fb51 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5dc4396847316fef31279100a264d10bf2fb78b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00e922bbd0b7ed6ad150d77d0ea19c52ac099950f05573661e9abe38055a18fd +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3b795cf7339b55204e4260657ae8cd4273e9a80 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63869579c086f7119202df1e7ec9e768afc8f08f98e211bb2aac46b201d283ac +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d794955c8e37e4ba9ffec7f7cbfb06441a72191 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d10dd0847addb4c680ad36a8dd9c6600956ccf8b6715c6ac4e97b877c1f2e67a +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbd72d113f0239db681dde4729f54abb223fb421 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:938e3fb2d138a898a0e745ae9cfef7df464ca075bfaa32db7b0b6529b8bf1d35 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ae640e8b89c1a1fd2b824d9dba08f731bf9d0b0 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a548bcda4b04ef0f9cd4fe11eca6f313baac55da96338a6f50d42c958f774ea +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4a230dde0c537d8230e3f4ae20aad01aa1fa3a5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b72c746b951c814fbd0815f35b9ae148747435347ec5d830efaf44615799b9fe +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dca3e869b68957fcf1d5dbee569076d51f13ad48 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d241fb94b54907946329160571f265c5b0091b8f3794365bec5e418a5bea037c +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..520f917a52122eaae5483f82252315d02fb67c51 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4de43a7aedb740afde2107af3a47083ff9431da7f6eb362a002a0d66d0b0c39f +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffb0ab47577c45d52792d11dbe2bfefe11d8829c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927e5c4e191b86de6d51cdc56ae3607186195475bd5374bd415ac48e6a5298f3 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd0e127151f36e02ffd02eb679520192583eba60 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:826426a145f236c878c80735240d745669a25d11cc282c316522b7b38448d0b8 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d31b32975df0722e9a5eab8213ce71eee880426 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50adbb25e81be4a162c3742be60b40ff74c71e2a1534a4c448fdb01ed8832c0d +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49358c8390fbd3894be396e418423870c643e832 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a36b5631f1cfb8a2c7c6abd35478d9a61e1de75952a004351427354f8d66648 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be968392929c90325a41b5476daad0c8adac5b1c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6094730a20ca341ee96405bbac6cfdee4b998489f8e2140b40a3916efcd0cfb4 +size 199058594 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b23f0d957f8f50ad8bed4ca4797aff1da3780468 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337ddf4277b0e9c7345a3f8a95a265f51f1e450237d39660e38dd7b325751a00 +size 199058594 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..980219ccb60d3e7f1e590b7cab4be3d613f31038 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5147ae069e033422c857b5e72005f86f438ad04fae426ec9ecb350bb2e78cc33 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a15225fb6466e48b44a70be936b9f0013f56387 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af25e8dffa0f7d62525584c6684dd44a1dfdb2b0e2bc0da6feef698074f31fc +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69d4ab278ff8c7bb8c1a198fe3b408c46178bcc2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0b3913c526a332bf982151b405c16d7e2d869012d642f253e4f6ee7b741b1d3 +size 199058711 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe9d7c46cc61392693b4e04e9b5faab5ea777824 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f574a70ee637a8d1bfed5f499cf828763a5c6be2f823becd954083af29aa427 +size 199058711 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dd57efc8476d681195f3c0f32785219e8458e08 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f856d2db6f7dab5b7723ebc282e43e1031b105f16cd72e0427b039e6a4d82864 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d2a39ace8bea9d13de93323c23b1e33a669e6c7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae2db037e05ccd972306228d3c30b1dd445cfb3d3e230fd95830be0baeb0aef3 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a12cbc9a9cf2ea733d20306733faa491956fc9cf --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b88693e6473d4154fa4467406ada11208ee8053fbb679672964071a742ca93aa +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9f23e93a6b1b8ec842850ee26ac67cd95437d73 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d13fb8820944373276064e32a858602a4674157bbfa6a632d88d0312a4934f11 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f7ff697f0a4cf6b53efd0d191a5dbdbe48e90db --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d36b8d146dbac4c9031467a60c4a1dfa15a395e49429d817f2446f1677f9ece7 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1db1876c6c097f67f98721d9a39ce0583b43097 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:399779a7059a598401af36704d5c1d41f0eb38ed0ef691b97b0c99558874b15a +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d88842ab38e06228f2dc9cb2b1b7a0b6012c92f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4996b0b2e588ff796f40cdbf98b2048363bae7bfe80fe0b2da156c92662e8ba +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c91d88b95130eeee892eb8327b4183c6aafef112 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb9e0a842cbab7defcfeff1a3c120dbc212eace65c53e4d2b1b8dd8665e23e05 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9da754741bd7ebf52dad9f2548044960d7b3866 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086f991a68bf85889aba38528790e60d3a5ef59257d0dcdc02ed029fe5ed0031 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bbf8e944c364d50d617b7396cdf46dbfacc809d --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50478ac19471d30cc4eb735be3f77b3864c97216b21459296fcb12068379e741 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4145fe1b6ea51724d4a538a8d8e94a84e7d80417 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea2039c85e5d4d1efc22904d1734ee802d85e62ee43b67bcd0113ae4161e1a69 +size 199058594 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9c7270b0a2eda0f0ba1b1497f0243d9089332a5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f81d6ce7b0303bfe60422d437cfffbfd0650f29456ac059f3c52ae1ee4854166 +size 199058594 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8acbc0d420a2470be4ce9ca9c0590fe4963b4ff5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10dc0ce17ffea0e74afabe29f5a622fa5a882d805718aaa5acfa803f28ec8826 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82f74d85cb087caa0949670278d887ff49cc25a2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e99206dc04de728a5dadd5e10b5019c56244955b60ab6c198c1f1271b8795e7 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..416c8f816a2c4831e70e469ef15b0c30f35a0879 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15545397c4080cb7217dac179164a891be1066abaf0436cb7389e578da10b653 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e97b24549f5759736998319a43241062e29a1ee --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1a11a030c1df876f0ddd49922ebef1220c7db08f7845ab449149e951f630e11 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33cf932a13d9c2dd4e20908c5578b0df9c558167 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:589a68de727801bcea348a84ca2381978ff9ef91cfafa41ce88ce671e4f43d95 +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d2577ccbcbb671fef3a2dd768c90d83ca78f9b2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70b26419125108a8aaffa9a69ee8d8aed4ab1a1fc4a71c79cae7b5c24ab66ec8 +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d521603edc95115e402151ad8877a998de5b82b0 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8af18e0364bc308d94d458a6a82b595998d9a2b985aa684ec5f467d4855802e +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48f46135ddc3906fd6add538d9d5d9c1a5f9b9f9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98323f60899c2860773512cbf0318eb55f07f151407159f1b5ef56891dfe2fc +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e33d969586a1ea718844cf336bd8bd030316fffc --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a029b3593b4dfa6a8dc463aa9e0a07420c4049ca2e9a3b092996304311ab2a +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99b81b25d660f8746b7e2886163854f8c1762003 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cb6c7bfde91138e3115f5d6579623ae5178bab771cf5d75a2ff88a419c09806 +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c3483cd6560071d069ac6ec343ae5640770f358 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28b2f70c19b54e68f751d3d08e4f99f4fac4980407a1decfafa468e1c3758618 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f15b2dd032d4641e31ce637ddaec1c0688003c6 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0255de48f3d0b9e0c974095d1af4228c1e242464a54c05ebcc9750af5c83a110 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74b42c04310f10ea2eb5e6e4596e92b17d0126e4 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90ff3948ce31631dff456b9269ad63ea53444e8be30c19813825489c72d70f7e +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e90ec1f02cee2db76b4880d68b17384ccdc38ed7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd3c7810a74eea4d36a0d596fd6f4e938645507a3d64115201ec970fa600dc9 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e96c7f7c4433dfac5b311af53d896defd5dc5a23 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2ada5023edd7bdfa4dc17fb5d3cbc6e7505fbd90d126e0a52cd4dd4a2f6fad +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..951d7af6b532c49cb3decfdc6eb88f0fe2d1e41f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3962c38f04b996d69025bed0cc1c5d8ff8287847a7a3b0fe608b22036c0633c +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24a5e084aabd1d4992440af39a699284995ecb89 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58d15dbcb0940043b400d4fbe16b8e0b88f3f7e06eaf1957a862efa10e31d81c +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fccf8cc4c9a6092f85775344addbf222ac5752ce --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f0b4574ca132fb38b6ff2bf7f4b010b5d03952691e9641a716d81fce3b49d8 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24b404b493ba9dff3554a330199e155086738a0f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b1ea720b7c190e7a814311fe8f848f7afae680aaede2f518abed98229e1a1c1 +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64c4cd1d983a65af479228cdebdbeb9f9e93d8fa --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee2ae4f5523d86a0c05732bb18da68ebe5d51ac52ba425bda4f88431562bb131 +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4294a136fcd49a61956ccbf83864c0815503a6e3 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74fe0481496fffe09749a30bba2fbfdead41f29c2f912500bcb3fcea7b3f4400 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12b59057940d619d2372d80b26fe35daa83f95bf --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99520a3f6599ee5f48825d6d9ba858f1affed005d3f919f3db5d8eda4e7db792 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dd18b7c416a61b239590ae043c4d512e4f09b2b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ec68ed8cfef45d1166b2bbfe7b45180b5d2101587286e5662a62fcf6049002 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31cb4a345203b2cae1533f9994cdad472d1d2894 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ff5dbe3a8aebbb761b64be82215f7898d2664a388461042bd6fd3cb37168348 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c33d29badb8c77214a0ccfffd17be659a036501 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b02145ef3d1b4414a13052dbbfc3f69adf6f8e06a4897ccce4a51b7e6ebb81b +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f17d9376fe16130597bf8bae849a7fb01e554066 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e1ef59912ddb51140b15239c6d6f73c469808130946fa4bf2a2696b79d038f6 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a07f6b432b94cf504a1d37a0eabcef2ced0da138 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7144a38a02d4dbc6a7215689afde0607817df28be954ed2e78fb8c1d3766268 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eea9ad1f55b3061e910d3a1e65ea91281100193 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb9826d86b949907f326102651437e9fa4a7c08617da8c2c3faa39f77d932e5a +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17c121a08cd7472e358adb698e19dc2079fb8f22 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc40d19adbc4bdd09593e3f25541c9b69dbe423252cbd6855daa1886caa808e +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22ff577df53bd822fba4de2d10347e026a6b28b2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9d679ccc087be552bac21e32012d0bc00fc35c73a67b06515c1d42b1785eea0 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d85ae1fb76ae05aebcf83e3512566464e647e62 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ade8d22260a7469fa7bcfe702eabf7601c2a44b6b478736669e5e0201f694d7d +size 199058775 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..968df37421967ad35c271784b721ab9c5d6f1055 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f660cfae711f3095475f4aff8a3c5d6dc6bc30875c329479e277dc11131435c +size 199058775 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b10a5025f26dec2fcb6b60111f67c2520e566d12 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9773759098743dcc6190e7591ddef4814ec83bf7f9a7a9ef306699c29010ac53 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3240f4d973a3a95c83734c157e246fef3ad991fd --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e9f35f43dadd9cca92d8e635c18049131e0f208c3f38bc7082bd570171fa2f5 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49f5e6cba2f5adbafe598dc9cfadf907e07eb665 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d1889eed577ed5a80eaaf7708c09aa2839a785c2990f30552dba22f92674f87 +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b234f3cad87150a95b58f910c1872daa0b5f3e8b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0495e478cbea4d7fb8e7c7115a12afd7d878c6191613bde9ab1fd9525c072cbb +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c45c6396757620814ed78955513896c90f2afc75 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:540b8d9a496e2c5d3092007a64a856df85aa84d934ff9a4ed35253ce684314ef +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e481458c115c3dc7eef90441b6ca2af05047980 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7491fe8274e8cffaa18c0c278f877f680efb537282b4343aaa15a344e0030559 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecdf2a2573f78c64cf8e495bc703737db7a8341e --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dc33e696bddac86ba0f74f6b0ca3a7f2fa86e9d58a9f51ba5b645d6e5163a65 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b5ed9ad01d146e99180acac663a8f78b91c1a6f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e7d64610fbd5dbd837bdf29e809bc3e1f64729d5948c15e9df395a6f6059c5 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7ced1bcbe92029d43af28072b50367dbcfff5de --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72fc617441beb1892a91a40a3977d2df143b73222f6e7d3053225daeb3e539dc +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f04213e353d20c3f257557dd4c6277b251005f9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6fa46ae4016efeafb58a9e279e61fa721cc129802ce3b0110919ae9363cf4ba +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77a53797ac89fca1018dc91cb0a68f3ad72d0219 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aacbfbeeefa367a10aea98a7737849d90c4ec059793e647afbf2f3fa44086fe +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29c3123f614a4aa1173740d05477a2967aaa126f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15621943a22e638bb08badd0506d8149f9c87b1f58400c65786a7ee61b518c31 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d59cacc064a6da4fb7c78eb6bed462387096748c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac788027dee98d1d232c2319054544a135cd6ebd5e90e044244783eb904ca103 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9e6decb9f876310cf67a565e1ed31c1c9b08c90 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18cd2ce688c2b77e28d8824c27d37be22bc23ad41c69c12da76106bac5241689 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e17f911b235a86fa1d3a65497fa555f11c54479e --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f49618bbad3d0bb5424725c966e76b52cea65528552e22278f03c60c2a05fd4a +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a83a4b99b22b91e2b500c6b5e6444f56b4a4f39 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b53e23c716868f56d3f281224127026bead97297fb26d3697a468e077410e4 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c033884aea06bdacc062942fba480c9d591de9a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d51bec43733902799c2dbd2731670139b350d02b38b6497feee426c44f1370c +size 199058914 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ce43047f56b5834d2d1acd00f40f9f145d0b1f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b709168a863439ceadef094ed81a663180d097728385d1e386749d666ceb67 +size 199058914 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ffe248dc22ae7161991941abea95ba4f4b9379a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ac8e3d7e57f4327a4c84c5d7da8e8d125fa2140944f9d7e8d6ac667fe784481 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8288da90ce48fc1e4ba88f23524d194f276c346b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeaf614f332d01cbd6b1657006d13005ee8214dc98940e50e0e1cbf7aa3f7df8 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22b28058a7b4ac1fff2b496a12fa74006ee60144 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faaaac0fc70f11475d3e0ed0d05cc953b12ec3bb4c6710ed7955a769f3b787e9 +size 199058711 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04795d30b07f4a26eed165ece629edc8cdcc6bb9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b01f3180735bbcedc65f3782bc1ec4f27d548dce667db75d052dcc4600a7ae5f +size 199058711 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ecaa4d0223e7411351a4fbb37cec8b64183ceb9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8b78dab60c72d3d4e0e0221b601dc0439563aee0c79e2aeb518a2411da6312 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dead9bec287568390fbd869938225ed7848efa22 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e18ae05debd3c9a146e6acccc97a99a00be5b075526f0930411cd3c60e11c83 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4812ea9a6e39db41a61234b6f7089c1b90f7b7b2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25b8f4b4c0e1bc69274504e48f60a584b9826046d07e9f5ff91d2791039f6db +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d4dd9591a00ec11d2dfe2491e9e979d1c4a0e0f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:309051089f00846e650d77613d49b076ed113b1017eaa69252da0bb78c032898 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21940beeb0feeb994508b76d5d864ae6d571e373 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26bd7997918a038fb815f21aa24a0e9e72ae9b976e9dd2e90ae3a732d6a54072 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c96daea0467d3d653056acd58dd905c23fd4e3 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:834c5f3500d2e5be4bc481a7440288adde09307b92e89187855df983c8c015b4 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a86ceabfed1770e56ecff392ba9d5bdc36f524f3 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f37b1e1a9cbf61782f9a236264145ce029cb1b0e3c1c25122e06c68bb3174f +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..936967572e88ffa57267f5c8f1f1e3453d923c81 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81dc2273cc6f217db10c1f436d615ad7f783843961aa7a7ab722d493995a9411 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..795273668eceba63617abd3251d46dc04d61e958 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4d8bff80c5fa7f5a3dff2679101c2f0868ba0a17d0063dd59990f888db4d0bd +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7083dd3a4beffeff0c6d598d864511dece9cb5c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c12fefec8ac1bb3a79a2c85be9518e9c3744b81770e8482b60f89270541662e5 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7dd035fd39bd155058be538195e65ef869880ca --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f03d481b24bb743f0288ee8e528178f44244c087565572eae19107a8775ed605 +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a52eb31162e58bb238d2edf588aa9bdc9f32833f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7cc6414c2e15577dd71388792dd8f3a27ee5847e83e1703a2579687e221a093 +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea0c04b9dc7cc0649350a2079f2ee9b2d0eb711c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1cf3939438bde00b18f02733fa517b823e3ed57ac3077c78e0144a7e755b642 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29a10c8778fcb09989fe1d034416638b3bf5e558 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27c09e729ffe5116788fd43836477f296e95c096c45ae49714fb7092536cf930 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae15690661328e6745115469664faf89a461d2a5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcf24cd8abff24befd248914abdba2129e4d8558afe859008c7d4022b1f9b230 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c9f97a67e26a1b31849eb168f722aa156d348b2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a35676d5100402a564d2dcf017dab026b9fe8a0f3418ff7099599384d3fd6d8 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4e1c177dfd19d38ffd5b67dc328c09addddb8eb --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:489f47549410a494f7673f114eed3c77928637b8a2dd06fa26fe070b5c257dab +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00bc6a9fa5c0f4467eedf2a31ca552cdd97db9e9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a2f1cbd551278bd29c2b3838fdb242d481940969d961dfdab71813edc6abcb1 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcd4610e469933e1ac640c6deb78d86f8c7b06df --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327e0407b84357df8bdb94e17cea0a740fc6443e5616ec518920681c45fdc520 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9de8d44b049bbb5365341549fdc6be5cd5b22bbe --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e3e560fcbf08b3db9a98ff5987ee24b0678de8bd6abd56559a94e945187690 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcaddef606c5e30c1a514e6d2e9704931df23ae7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af877d0943311fd021ff04b80fb4c0fbaf3151b983e5bf3af7aa4e10181ddbea +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4514e49de42b043320344af01d79e5a74bbeda76 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f8d4e7a29e5d77720e17c0fb76eaba4e0cc56c2f4844c065c0fe82c0e72d4b2 +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..572dbe5285233fcf7aaabfbfee977328f602d4b5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5881b7b7f6233794cf34adeac4fbb94e71a71cf007b1ccb6a367324878dca36a +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e460208832ba6f1bbb30c47287d417d3dd9749b2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34323e0fcc5a919f3c6f302048ce62d49565d59c1a470c98bcd8ac29999617fa +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a47e860bd6151077e19d5d3e696f10281c9529d6 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39705f2ec58e2fc81795233e99e0b77822a582605edb0584c67a8a742c8e0191 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4358dac507aacd0103534f845f6d963171a826d --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff8622ec67adc1345f91dc717a42303f4912f6a4635d10c6a9afb2fcdd4bb13d +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6867dd647c556765080419450020e9a67535688 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d5a68b16513ceb11fd5e56ca165b90c6c37c3386c8d3c0a10a34562e1f3c71 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e300bdb8957afe8e7c8f6fddd6090778c813074 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e5231f08932383c9895561eca9897ba08056d1768d18158eee36f0ed7420bb +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16550de3a200cbc519d83f59f6df89854dfa8e54 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4980fe4b62a875719bf27a95a3f644d1bec0602b5f93832bb8f2e6323e27437d +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3edb5827dafe192d5316a644faad1a2882ea2de1 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:453ebb8473de2be78d44099663dab93459e1b234090bc0d87fb438b045d69636 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32922db31728ae6a17a32ee63056b298878ee9f8 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909534043f983b0cd0ed9a29efe8bf6be3b03ea681b178e96a6585f1f73dbe64 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfbb6f6cf8d98bea5bb0ae6d8e66575d14f414ce --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88df1c153f10cf9af080729bad307edd0522434f8254ac5ee8b95371c775581e +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2c5c5cec9a75cbaa86ec4e2983179e43d11f336 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64712dc3edc01bb9d445a27476416f401615a00f554c5f3720740b90f1a909fb +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca8ecd5904327b675487db98f771616bc91aa6bf --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d998bf60cadb18318ff428e867bbe93fbedd790b97b4034bc021cd6a223892 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..161396f42485def6c572ad82168dfde1cd13b9c4 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c55a4b8151e9e0c2c7d8d7ec77f35435c9e44837eb77004dfddde1ffe118579d +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0dd5d7a64b836f10ff3b95d5c3f638792b52722 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70bc8012ec2b902cd2e87eeb73358fc02941778c20ec33ee3b0b02c00ddd4138 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b70656e667936fd06e0e1be88d596cf819438a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f62e11f60bcce85e690f5c4194cc8d432f87347c0331122c623239c4a658d24 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad5dc59d755736dbce47a95d73b6599ed149b868 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71d98a67ab580daf7bff9d019d32a55e0702c608017968af97fa5b975093065e +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dc4104ee2e33a2edcfcd44627aeb86239a424f1 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3d482d1c89254482eb3c5285b27de1c37db9d2324222a4b90c2e1c0ec99792 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e396b309333b19e6beea40632aa119c221375712 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fe61c3efb8d86d9aabbde928bc01bd2a507d90d459cd3ed367d9f695ae812a3 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d029e690e2cd20bb07b698a9592e2c94287b0fac --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef35d8ec45c194cb1ad96ddeb7d6598cdfdfcc82f76ea3e9091c6f3a2a183b04 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6b710c935f32df42e41147926f36139efd3a5cf --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2eb66d097f6c7f6b88771253744cd9a5be4632b3acc1a1095c8668144a54bf3 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3aa302ea0541997bf09f494737f5a775bba9c404 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb70b052174fcabb57b25e83d663351cc8ca71987e94d2926f81329cffc54cf5 +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..167dc37b496a7e88ef9f1f26528e904a5a3fa560 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1ece125f79675bc591afea38df058c799dc19d4d6769c95adb786f603f00213 +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d9021246efd453847d9b2b408cf3192952e8f7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c43c878a79ed1725678d4db92ab1bb2ff8f8be14d8c31264239cce014d9fba0 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a772ce12b7c5963336912a86a69e0f90f381611a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8422b1b5bd7939669f947c2c175bfd56455b2dcefcd79259654f00d837e6b59a +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dad20e7584fc40436fa1873a08b4e4fd9cd46eb3 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122d4996022e2e28d7ac8027addba0910d8d322b75f55e08405340f13524cc06 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f366e374f7584cf49d9dcef4274a26d56ac374bc --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fce884839714a55a63053cfeb373299c67faf1a3cef77492fff88bf450b05589 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94f219a0a30aee944ac30646ca6c93bbb55ec4f4 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:635d17857a06668ef7c94ad603d7165f7d4b66640ae3e383cf018651d991ea9d +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1e9c76509c7029d27e6763d9e5892a9ea73fce1 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce2a75644ea1cdb0bcadfd7ff48279526625dcc54b594d69730e82513ea7804d +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..caa8bf935475120c26acac3a61981d590cc6a727 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9169d1490fa6b978849cec317d099b25121e0b54e83346e0d41d22bfac2e4367 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41f4366b24bc03f7e43f7ea7045f6901a68277b9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b307df2214a27882cb0022d92c90ea9e2b89ea102825431f1e3100b337de45fb +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba41789c2bcc3e45bf1adfdbc9b24ed5c34fe018 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:174408d42209fa58b08383c31976c77c180baa97f28555f0fa6b73255963e659 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8cca34cf08963d2bafbd660190308aad15be7d3 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916b375ca7364a21d6068332bd1e9d526fdc5b5e15cbba08bfac36a8dbe19b3f +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b29351972e3bcf905dde922619dedd7bb1c8eb9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad00db927877c313228a9ef1901d06dc280bfc0069f22986b1dc80e2783fb0e0 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7848625cdb159ec47c7965a2325a52f1a6f3515a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d153696bd458d7616deb4b9ed66666e3cb4cad8eb800a91a58fe2e39f7cb5bf6 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ef93be79e130b4b6ad4a540c48eafc0bf1c2872 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c9be1f0f157fc97c24addbd628e8eb783c1f230fe6d631056d70a4d1dad28fb +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c0d24b0bf0e51dd70bf9353a1586a70f614c48e --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:765e1bbafa4a83be8a50ef5ef5f640ab0e5b2ca5d9a4e36e3f8605c36ae7a572 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d920dc9013cbc5e3645217347382a5b08747dc4 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a66fcd6acebe4154c02c23e32504d0b7600e7547648e09dd2f5e63e8b5e6a6 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c1d2186a6e101bb2c3d27d45c3dec8161e6a994 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab31ae69aee6123341579caa9841108cb7df28ab321cc82e85e8a5d487ae1b65 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e421452fefdb569f89d6fe23d33f7f08fa664c77 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea5f24ebdf35e698507864ae259aff4b6a8567189d27115da974126203ab6f55 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb27036bded1c15e185356bf160ac2bd53797cf6 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bde6c142d30e5d9f12aaf1bc6e00cfebba35b3b253b66ae7963afcde20b01436 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b342022e4a41d168e55a958622b00c19db9c7a9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:675b0c3ebc8736f62980d365ff211697e5932ad7690fccb86f2b46a8a6207abd +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a057ea3e11b0b894857f9e61525367efad02136 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f923cc8e31309e5e6ae61afaa9ce5e76e7b705cb341d3148e5b1fccc5d0a29bb +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..390e024717076fdbc4fffffc3cfc533bfb41bbe2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4ae3fef4547857499238798aabd7d942fa827e3b7737af3ec8c0a0572f7fc22 +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b1956557d4622ac81f000c490302c1cb965e366 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e38e749feb3273659614cf038fc00903cec586d75cab71f4b005d5bdfff59a25 +size 199058647 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaeb8cfdab875f5fb20f94ac5e4a62e7ff07c9b5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0400a55daa2dc0611543f315f27f9e11ed895f61c0a3fdf37a96b70dcc4429d +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f47970d7cb3a88062588d49b1666019f0d9e9461 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c46f9944e5dd378cea8e78b6b01b0f178d2dd22000bdd8421b66626bccb431f +size 199058850 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..076998d8527d0b64dca6e9ad3e10f5be38a67593 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ceaf206e68e33dff48d582b60645e5f90cc24ac47269e832b1b93f264223e23 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..375014986da361ef57daca74af8d38cce10ff2f7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9304cb1d3beea9e0228ac118837e681e46088991a77dad7065dda8f06e3f3ff5 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eda8fe96cd3293aed1601c3bff2293f14411027 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7e369493ea03de4fe5023a5c6a16fe23b2feaf7cfc64bf63cd68dab7471dbe +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..905d8846ad537de0d5a53c2a78cf30d5a905fbc7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ad01fa5f2dabe98790c39aea1b4bbcaff791a639a6f26c125b3d81fc4a80cdd +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d81aa6e108a0e5b18ae5980e84254d6baef528 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fcdec8f3ecbc528f08e57ba39435ccb5592ac3f51ee687865f5dc7a4c9d61e9 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c80e762c6d55b8c74469f88f89ea734eb5799d5d --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa1f8cb4358f4b0a4a1cb4f1155bcc41507f9006fa788785e7e11b401000a76 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3dc2af367327ee765ab1da6991f8972d8d3e9d4 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513ae8d99400c6e7bbb636e9f24811be5738362ce2420caa09e4620deef135b1 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b00c27383f2ef03680fc62d50bfc1966e3d35e2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e53b2ee7083a7f0002937bd8b7f0ef4bd271c8c567dea29bf24afa1afa991789 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27bfcda5bfe4c2c8b9d65ed4cf0a4cd442e27344 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf1405e124185a37f28d5dbc2f6ad84c559c7fef28794b9bccd7cba1a57b936 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69b37282e82fdec61bfb5eec22970fa25fe8854e --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23406e45072f9f13a764c69e2f2d81d2a274b0921d84b18b4ed7e0ad1d958ff5 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8bd15cbf7201aa9d6550c21efd2d63c765c451 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:128238d22f6b1b5fe1d53c4f82dcafc77873e41f1efaedde7d8dae98bc3cfa15 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b575f5ebf8493aaba37d5257006d47fc4c668a67 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08e89bee7d47f490bddce6d75f95686866bfceff086678baa138fd7dad5ec911 +size 199058722 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a981a30b8dff1753b66419e66a584a26296c481 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c95707783b1ea2f5be94983cbfb5a49a1faac3755c0060f670e338acad4c5e76 +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..672d9cb760974c821930323fe55a9e4e4984d977 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25b1595baf8c36866100d269b203c2a0575af01847b7c5de4c4a4a41327204dc +size 199058786 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b25bcb920433350d363ad5801ff4ef3d9d08b454 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cdeca86c86a6e4f9af2f916a591f580de87c376f52c49ce0d275308f0087ffd +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fd036e46364326a9db92fa9f883cf16248bb2a9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f18b9ebe0fbb33bc3ce7950e7e263fdce63816d93e6b9fabef4fc09afd27ad +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7832c46c5af9dce75d2242d5c5b30050443b79b5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f2a90a012e7a46ac3384e2f0900281704f36cb42dab0e450a055adb8c58c2ca +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12447faa77fde2e2a6551a4bb8c52e7c4de82e26 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71d53b589c81efcc1e3fd0d024ee062be40d6f307f1a1366180aa52a559de097 +size 199058658 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91b2939a88114626f9568f72fca22a5b0cac4f4e --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d95f7f8173c2f69800613be1c12a4657687402c0b30dca9bb467e5af1ac881ed +size 199058839 diff --git a/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6e7e9774dcc44fa6be9c481c7d48a4eec79f333 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af615e9a9e3d8e358fcefbf95f281c323bf6b8ab64776265ea252484c0e25478 +size 199058839 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_01-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec81ea7f45fd530c9cdec0f0ff3c2d0d53f1dac2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aafd564ef90aeee58e842096e70b925a218708b5e2a0892b3e99fba6d9893fc8 +size 167511299 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_01-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af23c007677accc41da384f804703f782355ed1c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c5cf368036d3c35f3411c1191ffd134cbd339469e505eb61d5d885ff06757a +size 167511299 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_03-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0443519e02e6a173a044a6148c501aed4d83f992 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef34b98a0c9306b06e86e3fba22b616f7ce41ce9c1f44d4331c6b7025912b15e +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_03-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d1147bd3ab79fad27962e1c1a97dab8721fdab4 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a3b39a42ebcdff8efccb715a5ce902c6522e2ac77488159d673baf3022948b9 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_04-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..824794167278e91bdc3ca60480c9c4cb169fcf0c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc1d3ce0eeed96480cc5baeaab0888a0a284cd91d3a6ee305d794595804afc35 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_04-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33f52df0fa1c3e03a2d6614b168045a242eec0a7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771257abecf732ab2a3f686ed2b0a170efa50b8fefef6aad9bb0ba3432ff2343 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_05-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d56d0a720a310996dc1283706e352208a976b207 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6eb53f13c39c746f8eb1027f36f70754d217459c355eacbac4ae19cf9c5c04d +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_05-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09df034af042c7fb44645b1e884b791cd1a13b6b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3bdc9cd5c7107ac0f813eb9e355fe46e43f9402a37e250fff398093d655f800 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_06-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4232e510e76ba2645e1c35b2e17e92414e3fa52 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0de2bf4f6cdc78c2d7d2d0c63a86409da0168663f0176e458cdc0d131d6d1db6 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_06-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cb4c974335784f81607a55676a5a4d58129234b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd83d20b98847d3328b66bb4aeeb383c50267acce5f48583256e2085cb8e7344 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_07-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d85c030c0d7b97e3c157d5df45e926e993de0839 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c987181fc4d4b3746b6b19b23808b4d5c27a426cd5cecd3e66122a941501871b +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_07-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7223a73c72e47164638c0ac45b094f462e4e2ad2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5948dca6ab76cac8f645bfaee5e7d80fed4aa4cfb2ef98aa3f88760a5f0e8c3f +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_08-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4153b01b85088a64c0334171b2c22e9a3238ed53 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bdb5ce477bdf61e1e9a21c990cba5bb831e183313c0883732f3e071096e4e24 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_08-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e10177d6a4198183905749ac9e9ad61be7389b49 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8479ceda0bc9afafecf7b56404754060f120ce7453ddd05ad9cdb984934e1f8d +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_09-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..322f701352f2276c8aa228c735462a0406019311 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb611cdee0c779e29122f6abc17610bca89699b6e79ed3b5e80ce4b775c0cc2 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_09-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bc49403949c285a4e353b2451b995a35ed3bc44 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eaa952a0281deba0686ed7a75818c69037c5f7eb43d0c0f8f27dd94ab8c0598 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_10-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..104e7a13c2232abbcec18bb9b404a89dce308e4e --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed1c69e62bf774606cf76cbbe8317eb3fa88141f6f37b2274cbdce4d04889f11 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_10-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..529ac5e58b947c0c0b44af8305f71165724542a6 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ac23285f4b8856b4a6a13c46efcc8ec2d1d855659b112186608e1f16f31667d +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_11-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c69a90677f853b83a63d96090067ed1a594e65c --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8980bf5ba605d10c905d99124bf9efee06ba97d9998042610f3462fbbcc96a45 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_11-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99e84b0f1187d94f8d9024764f9336f3ab798ba9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78011d8ee619b487bf1469539dadbc1d7ee2779c97397e47df0d0e882f07d688 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_12-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f146401a6bf8d99af0363ad7cbe7968d29ed35f0 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a67f959ea59a1e0603b42a66da1953110da36bcad8fad31047443cb93c23fbd +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_12-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d801913da5184c6d9a0c8f3d7d5e216de48d39b --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14ea5cd808ab87aa9b6e96444bbabe2d9c9106cf4e4420f9fb9e8ed524ab8566 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_13-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..385162b8874f41bdb6bdbdd9c31d4aaf0c700c55 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0946c724514b87b92173e3508e18e72af46aba62c4b13165ee5201b678055ea3 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_13-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80fcfa46f2cc17d6099fd7c8fcc4fd959a41218e --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794def5bee93f2d7d02b8c35901dddc8f243347bc37d909d273e6d550afe2eed +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_14-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..017e193da34e4731af37d053b07f74f5a2076c6f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fafbc034c73b8ee09be490f54df18972879f414043389d3fa9efcbf19c3424c +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_14-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73a8aded885cb2183fe8122788b9c77563923a44 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa33e44d63ee8ab5ba7119bfbcaebf8a22fdc691a7c756ca0c190e9e3e1d1333 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_15-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8bfa8ab82ca9a171d0f52609b3aa55cc75636b4 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0e2bdeccb43612929dba28b81775321393a89d95be833b5a3d0bbcce189e81e +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_15-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..412cb78fe05c991fa3e9017c099f696aed2caaf5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54cf6ddbec96c9af41d2bd83f9a5a83e866844bf588c614a0691078be96916c +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_16-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72e033a09ae1d47b07466669ddba95d1f07d37be --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d59350011d0da3b1f275a7f1b8814c93ad98f1aac90ed36b24f572ceec6b91aa +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_16-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b09ca645c54453df2ef6bc59c82c823e45df4528 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca6e8828bcadf92e7f7ffd035a14d233c6f60669f3e79bf95699b51b4d84ee35 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_17-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94022c058ddd7bacc8ba9d177da8a4cd6111d409 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0308785b9adf4e897b0fd45a8287018586536d1e41909890a0d2175cbe71c56c +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_17-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ecf71a169ff62f10e9e00b11f24afddaefa211a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8457d63715f2a023ee1b62e7cd76d3a8a0defc1fc8f92e724620f836fcf70fc +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_18-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66573a3ed50ba93ac5ddd3dd22c929f4575c30b7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b59065c0d9e5f7573bfefcd850af4405c5e491a6dff531b88d5538e1da3a8d +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_18-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca0d8d9a080405e985aa6301964dc502ecf0f129 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06576113dfa1954737d154fce416cb776f0baba175f4e3867e7547ea6fee9767 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_19-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c5da0fb32c413df4b36323f2da6ff5a21a415c2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55fd4595e574cc17cb60063ffb58865e0aa8492dbc820a3dcb5783b5e4ee4fbc +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_19-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..126fc23480eb9d6f820b7fa102821dedfa5f76a2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa9810c66e873f1e47aa0283a6bfa9144b3692506ac08b94ebc74262d489c55 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_20-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4583e7585cff5d8c3524183b933b5aad1da9538a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5da592f54f3e64e8a18e7e3e266afcd64d083d4f74f428c6a17e58a924de1f5 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_20-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fab290b24e75e3f71bb1b1300c8151b2363276f7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b47c1becf1ef8d8de9eb37b57771e6cd60ca9931ced62f011ff3223258e96c3c +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_21-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a678fe037059146797aabd684df4f61f59a0729 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe34a45f6787ca66dd359a0093035fe27aa948029c16fdcd355f6a916926483e +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_21-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43d35d65a21011734efe48d8af0457849eeb6112 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a943f1c7424791c1fafaf51a3745934954d85ca2192dc75a17ae4e149ccb306d +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_22-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa26e204d55412e4900630dd890836b6afa6538a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d5876e1a4066dccddbb261c8bd7a9ae8e83bca8d67890fa5bdfb9e8047117a5 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_22-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fa5c7b6a5f1737f4058457a3d5b996e85326a1a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e799ef24e9ea48bd8eb93097ea0e9cfcbf8153d04d90c05ea19879eb24088475 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_23-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85385d3fc1540ce65f558bcfc42f6f724e25ae15 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7a50dba1468f7461bf70cae1c90b5b38366d52ae095cebb76546eda8dd377b +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_23-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9deab1de0cce7bf3ec2c1a8c514a7b7da1e1b9bd --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec464d4e97b09b6770229dfcbcf60b76b54a2b36e7c6fd0877477974e3c44e8e +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_24-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15ec26dfde2ddace3dd593bb9dd6d930801c1385 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a1041d8a9d32fdb76e62eda054eaea7901a3bbf4b5f6bf2292c83c77eb1a5a0 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_24-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f0ffa56353083015d3994f80a48fdb5c4f8a22d --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:022db030886b7ae5861138748f5d6d206be62bd91cf3c1bb4765721c3ec4760d +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_25-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3bb0dd864f43697f5405bfd458b0cfabe651ee2 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d6197079fc2e4c47a8424b5704249713511fc1c7e1a329daeca851ac81a34d8 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_25-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..633fa5356692da48b9fc6f009a6caac8ad75c628 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b94fc1ee5221fe4840f8837d06d670b1e24d67c33f62b47f40d53c55b2859bec +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_26-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd04ec09591d18ced6c9d1be78e704d137e59958 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:829242ecb0bb76c3417ea1b689ddcc4f8c491a7878676ed4b3480f140c139178 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_26-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd273fcfd2bc4ebca65df073cd4cee774d04cd9f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d52d44b873418bd5e67860fb744dccaccc1974bc752286742c381ebe753961ad +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_27-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adb6a510fee4c2790add03862faa4cc6247d2383 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b546e7f2edb4240b20603dcca5650a399741592df52065508fbdae5dabef62 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_27-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad629159552aa5821a8cb189f8e0ec5e9d763eb1 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aca2d95d06da330242c4b8d859d8746d74f10745442ae140cc4781bf84cec64f +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_28-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef5d994cff964265197ffe247fafa81e8fcf0ff7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323fe626a5f58f664c6a3f9beff81edcfa4ea43de0008283dd95248edb06990a +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_28-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e821c17bca03e162606a3595c57ccb3a34e061e5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a1a0810aac306ae4c48cff2a280eded65fead1ddf17cd7dc594562d3c6e124 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_29-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f37218b23ad959a3abc4ba2e31415e36058e84b7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66b49804304dd66c7694f9f28018ef1cf15f240e28129a1c2360a429874dcb99 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_29-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f810465df2f3e0e31cfef165cdbe55de8e84c9d4 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ddf74e99f5a0997d16e337989df1931053eb16c7301cc03ca72011e9af38eb +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_30-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d66be9d4a34491fec79154725180a7f645221bd1 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58fa14284386cb44dea30ebbb6c3c76a84c5e91e4f120d213c8533ff006ee3e6 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_30-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5e1907e578eb390ff71bdbf9f45ef16adfa4564 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e85dacff47694c3a63dcc786481f3b0f69c925b62a3f916587922131049d865 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_31-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10daad16e51b04d5d64e6e2a2ca34c3c43fa6ca0 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dfb2165970d1a10a0035df2452c83075f8a79c46d297ccca86374b85fa06a8e +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_31-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f307121169edc1cb94bebeb29d9fc47fccd22661 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c032a5dd60d642cae8f8683ba870be6d0a7eda6e50a4b04edf810c31993aa7b +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_32-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abee4da3ec4e6768d782e6cc5615d20149ea57f7 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cd94b1bf0ba1425e5952a2cb89e11d265f96fe7f7526365a07b9d74aa795d81 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_32-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66890eacf5d3f18fe83ea50184c797f824543c39 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f726aeb4da0366d9eeb24356494a0c6624a9f1a28bcb00e48235a18fc905d33 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_33-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..345bb5f15f76145b8d4ce9cab89734ef8333bfea --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ec5ccbb86d7bdb5548bc536f27ca1d8a6b21eb52a148a7fa8bfefea7a90018c +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_33-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2c0db4f10dda53eefbbd2bcf5c23d7c3f327649 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12fee77b5240df8e84bc34738bf79ae62040f19566fae7eb2065130388797fb0 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_34-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..045a8ab3467bc1780cf9e05eaff9bba81c937381 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1698254b5b471caec13eafc0e732073cbf3e8598a2438196e604e5902c57e512 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_34-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d15ee0b0f7db5e090a9fb7af5a6173b17ee048e --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab726496f53277b5e7a0267aba236ca58a8530628502ae7596793befbf7af119 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_35-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..774124aa8d4a975441fd07976ee4e27f02fc6a7a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9556b21aec1f6e08e7a615b61e47ab52916d8fb55a844bc379b609fe31e8e908 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_35-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c452da227ca72d407519308cd89939cec4f318a --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29e228d2845d2e952d3eafb698ee6ae1db889882da5dff1dc437de3216f5253d +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_36-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..001539dc95ffdf6005db00ff771305ccdd625856 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:967bf6cf6cbaa00677cfe29908e753c32c10053da59879a94cdf55092940d3f1 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_36-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00f99d21a391b0b18f39150fd011a36b055b5e20 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ceec1e7ffb1b6154bb279e22743c7c219550f8a94517aaf921ee9fcecb9d98 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_37-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47df36106ad96a5bf108889ee2c1c36687b67c5f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9461662013563e1c43707a095d837ea3509a7d064bd3a5f734e6b202e0efcc8a +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_37-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f0647e47f458121a0a9ff7b90bd0529b2b18c97 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9c1ce55e7a8a48f440247d50cf06ed253a41b5a51bfcee7775558fcdcdc6795 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_38-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bfa8f89ea13614ac46daf76585d20c4b9e1dc7d --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edeb8f94b13db73bcb631843aab82bccbbc08cc453c55877d8e3713997020d07 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_38-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba5ee1caf6f6b9ac7f725ca957be5dac681db1f9 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11b43cb0ab0c9cb64651f4a5268dd2cd356192ce2b06925ca7a2be035d86af8 +size 113308931 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_40-model_00-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c45ca7f2762400c8fd15446b2c48989c76724e64 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:918db5a656880ef5f1a4f00ffd30a7c4f3f3fcea84bc1be108029af96e6ef1ea +size 13507 diff --git a/4b284b84bc4v2seed4/global_step80108/layer_40-model_01-model_states.pt b/4b284b84bc4v2seed4/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1ece38dce683f8a1a6c4704689c99b4f455bcaf --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b7f2616b8fc99123291bc5c20d147dda5a868c81e4ff8e70f6ec7b38f651edc +size 13507 diff --git a/4b284b84bc4v2seed4/global_step80108/mp_rank_00_model_states.pt b/4b284b84bc4v2seed4/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48c512c1b59d18f9b26f1f0c5bda19452f70d52f --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fb8d240188a13481f9f4cbdb8fb3ffada3ae12684bbd78b0e9f9239e4de0473 +size 51443 diff --git a/4b284b84bc4v2seed4/global_step80108/mp_rank_01_model_states.pt b/4b284b84bc4v2seed4/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46d544e180d342447772d712af102bbaa106cec5 --- /dev/null +++ b/4b284b84bc4v2seed4/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:403918a35e2af9d0dcc1464962feb9790800d38af55af79d2574b045905d1ed9 +size 51443 diff --git a/4b284b84bc4v2seed4/transformers/config.json b/4b284b84bc4v2seed4/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b84bc4v2seed4/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b84bc4v2seed4/transformers/pytorch_model.bin b/4b284b84bc4v2seed4/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..fbf6cedf62c937f4fc39af3f63fde600dcc6e45d --- /dev/null +++ b/4b284b84bc4v2seed4/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b549adf2afe6fb7e617f16a577a43a9c75ff09124b8f8bb945ef0e236625e7d +size 8781203669