diff --git a/3b_layer0_mlp.down_proj_input_reasoning_representation.pth b/3b_layer0_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..19b31f8f3ce49b668e1d3b64daf5b59adeb5df79 --- /dev/null +++ b/3b_layer0_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f820734b2bfbc27026c6b67f96930657a5def8f4bf888020cb4b7e752fea5f57 +size 246892103 diff --git a/3b_layer0_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer0_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2db19bbbc724c4ad0abee2c6092b83a54cc3f5dc --- /dev/null +++ b/3b_layer0_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e8bc3df38cfacd84b797a28579c459b1a488fbde5c4dc7ea0930f510676da83 +size 246892108 diff --git a/3b_layer0_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer0_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..35ac7909d112cd6350592509c843ab3a5728dcb1 --- /dev/null +++ b/3b_layer0_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f74220ceeae06af929f018d017c17e8166d980470108fe1411e53759741aca94 +size 30862939 diff --git a/3b_layer0_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer0_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8f80dafcf6fde1ede44eeb0631f279f4b6142d1d --- /dev/null +++ b/3b_layer0_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eae3e21f64e5f54f19f123d4950badcaf3fe3c0971186a6a375e6e351699a524 +size 92585558 diff --git a/3b_layer10_mlp.up_proj_output_reasoning_representation.pth b/3b_layer10_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..995d35ef0525eb6045142c82c1de5c2d83b4501c --- /dev/null +++ b/3b_layer10_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:511e9256ca00352e4b2694bf71f2636b54fa548634145f9fae270a5cc5ffdf6f +size 246892103 diff --git a/3b_layer10_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer10_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..dd84003e476c0dc423d9734e84cfcea2ba1cc1f5 --- /dev/null +++ b/3b_layer10_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f47d12f95c98555ed4cbc1eb8ba506e7901311b9107f6799367d99e4d6efcaa +size 92585568 diff --git a/3b_layer11_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer11_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..3661a7675d5f443cde1e82c8e8c56153c2296b25 --- /dev/null +++ b/3b_layer11_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:159d951bc7f83807ae800c4cd7026822f61c2a670a264908034aa5c5470419bf +size 246892113 diff --git a/3b_layer11_mlp.up_proj_input_reasoning_representation.pth b/3b_layer11_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..be0496397d663ae641cf8eff05bb6673314b0a76 --- /dev/null +++ b/3b_layer11_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c53a1586d9a2e1ced4a248c926056aaae6852cfa4759b26d8476e5c11287fc2 +size 92585474 diff --git a/3b_layer11_mlp.up_proj_output_reasoning_representation.pth b/3b_layer11_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f745413919612cadc17a2b65868f5f6b1a929ca --- /dev/null +++ b/3b_layer11_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f311c278b2d3eb6e2ef8dc25dd24c13d2202eb0db70d482f29d56af03c26feb +size 246892103 diff --git a/3b_layer12_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer12_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..83aad84b8beb7b1dfe681ebebdae256696f57a5b --- /dev/null +++ b/3b_layer12_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:329d61088666c2bc9e2700e845661c6c7b4be4efaa6ba7049f3d914fc3295150 +size 92585563 diff --git a/3b_layer13_mlp.down_proj_output_reasoning_representation.pth b/3b_layer13_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a9e3073379c51c404938af511aa2660db3198984 --- /dev/null +++ b/3b_layer13_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eecf0f6bd33df134f89ebad0f9a15c42f32532ce666ba696ab21b40219236e43 +size 92585553 diff --git a/3b_layer14_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer14_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d825b23a7a6968190c8214d931fa2c708324c5f2 --- /dev/null +++ b/3b_layer14_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ff06a785f65f8787b82080eec32bd526f301fd877fd5875ab2e90d27a5851d8 +size 246892113 diff --git a/3b_layer14_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer14_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7bb665f181acf1b6996ae992c58a4f02ee9e5ba8 --- /dev/null +++ b/3b_layer14_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e6a0b2649b04b5366a2632d09281b945b791a99e666e661269bbee4e8fe26f +size 92585563 diff --git a/3b_layer15_mlp.up_proj_input_reasoning_representation.pth b/3b_layer15_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..83d465cc91ee0fcc300941b1586ed9bc7ebac2a5 --- /dev/null +++ b/3b_layer15_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e0d77970a74cec4898f949929d2f9e9bc8dcc1c01ce863ec722be43a73bc57 +size 92585474 diff --git a/3b_layer15_mlp.up_proj_output_reasoning_representation.pth b/3b_layer15_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f268c81a3062594f9e69463cb95bb7411c6902d3 --- /dev/null +++ b/3b_layer15_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b8f7c22d1bb998a5cd419c73fbc8c15403543e25cfb2d5d1fe8aa0800618e05 +size 246892103 diff --git a/3b_layer16_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer16_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..fce0b5b9b525ccbc532ad60acba81512155136fa --- /dev/null +++ b/3b_layer16_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23fd6ab6295488797556c27fde514406a2abca0f71710dfd5debb4a320eb28e2 +size 246892113 diff --git a/3b_layer16_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer16_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c9ca635df7db8bd9750277b910fbda722729f148 --- /dev/null +++ b/3b_layer16_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2379e9f3bcebd0ee0c26a18ba022b400c1f485f21becb961d9b4e66e2471bc2c +size 92585563 diff --git a/3b_layer16_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer16_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..633b45511806eba9e67f2769149bc3ecf8ed6ca8 --- /dev/null +++ b/3b_layer16_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:228c8a5efd5fdeb0c2a3a818e899981cd5d5326300b91e85eaf740b162245129 +size 92585568 diff --git a/3b_layer17_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer17_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8cad1af8773f58766f6e14f507c59a63b9287e8d --- /dev/null +++ b/3b_layer17_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1938b555889adf63e1cf5c2365c56a13590efa57e9b536ad25855d34de37e4 +size 92585568 diff --git a/3b_layer17_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer17_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..573473a202694911e619cf8fb838e42d22cd7fa9 --- /dev/null +++ b/3b_layer17_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bbc3972856e3e83ff01b37989cc1c94812d76ea4aa95003ef9b43e7da50bf82 +size 92585563 diff --git a/3b_layer17_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer17_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6f8632f85804942adc6483e13d55162890e9f778 --- /dev/null +++ b/3b_layer17_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02673f56519b1fd28d44392193360eeddfc6a4aca337a562bdfb38b825051d3 +size 92585568 diff --git a/3b_layer17_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer17_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..19d91f753f5531761ebf619b8da8b89adf71f66b --- /dev/null +++ b/3b_layer17_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c00df5a22e252522233bde46939d22fd43d55eb275a5e4e3aa6a0970d8a2ffd +size 92585563 diff --git a/3b_layer18_mlp.down_proj_input_reasoning_representation.pth b/3b_layer18_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1031df49da2ea7fa727f0e110cafd5b141fd5d2a --- /dev/null +++ b/3b_layer18_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc426cbb21491bbbdb017b73e4ea928ae8af2862f845b7a2466c4972fbb9e0e +size 246892108 diff --git a/3b_layer18_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer18_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..03d34c4f2c710d9fd64a4ff74ff728d42f3d53b6 --- /dev/null +++ b/3b_layer18_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9e59394d96230f8f3dee9be92b56c9a0ccf4fbc3088fde56ad9b8d531dce63d +size 246892113 diff --git a/3b_layer18_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer18_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..484168ab2d6a55c411eb77e5b9b109ed01eb5fca --- /dev/null +++ b/3b_layer18_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce10b75bb38eb88610649309f872036e0a5744f077f480bad3607494d98cfe94 +size 92585563 diff --git a/3b_layer19_mlp.down_proj_output_reasoning_representation.pth b/3b_layer19_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..48c24850453c829729dc16aad0ceea578034a614 --- /dev/null +++ b/3b_layer19_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:932e24c96cebc00be18fffb0743d4d029d5e83ea6001c9ca821efbfc6778b10a +size 92585553 diff --git a/3b_layer19_mlp.up_proj_input_reasoning_representation.pth b/3b_layer19_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..52bf371bd73e04e17edc341f0dc2892db2afa974 --- /dev/null +++ b/3b_layer19_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a32f64b7e6715f613f893ff25463d6ff8857f1887a33d8a05d7c42aaf77524ad +size 92585474 diff --git a/3b_layer19_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer19_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b0d5df26d47fb00bde3b37fdfe4c215d9b93a54c --- /dev/null +++ b/3b_layer19_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a46229e9927cb8abc2f58da4ae2473c400c6d6ef7532574c53deeaaf2cca75 +size 92585563 diff --git a/3b_layer19_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer19_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b13b156896784dda0be1054d225482d2f7afbd86 --- /dev/null +++ b/3b_layer19_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96b14ffc45bf393c7b27b3632811ac460ac3ef65692d095a592688853074d0af +size 92585563 diff --git a/3b_layer1_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer1_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..93426dd4b46f2deb6217ef7c6aa2fb7b67b8ad60 --- /dev/null +++ b/3b_layer1_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e897569b4dc6d28e999f5797856e97cab1910d3921c53564752f3a8df78a0572 +size 92585543 diff --git a/3b_layer1_mlp.up_proj_input_reasoning_representation.pth b/3b_layer1_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..dc7963841ee136ff4aa95186c2a2c4acc7d51cda --- /dev/null +++ b/3b_layer1_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e6bd60580bbd6d55e48ae262cef17441f4938bd05d2f3f9563fd81748547f34 +size 92585469 diff --git a/3b_layer1_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer1_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..254bf1d067cfd908170bd44579d4eae3ddea43bb --- /dev/null +++ b/3b_layer1_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb58d306b37eca00a7f1a08d1e8632e93666e152673cab5c1089955b4a41aec +size 92585563 diff --git a/3b_layer20_mlp.down_proj_input_reasoning_representation.pth b/3b_layer20_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef97239cffee4a8955cc6d04d606ebf1bfad46c3 --- /dev/null +++ b/3b_layer20_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e5f04ab97eee932d412bc0814613aee163bd60f1eeb40896a20776a22f676f5 +size 246892108 diff --git a/3b_layer20_mlp.up_proj_output_reasoning_representation.pth b/3b_layer20_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a33b02d70da4739cbe7f45a6fc7445f26271a86b --- /dev/null +++ b/3b_layer20_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:322aacd595c80b827ce83705c082b31963ec70dcffd8f76eb0b144b02eb5650b +size 246892103 diff --git a/3b_layer20_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer20_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d654f1b320eeabb226e6c9c1a1e44410044ae7f5 --- /dev/null +++ b/3b_layer20_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9eae70348bebf814b5c9b5b60d85e68b7d750fbc0c987e6c75c3f1694aec4b +size 30862944 diff --git a/3b_layer20_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer20_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d5174908c88b64a1aea8c5766c765f20b735228b --- /dev/null +++ b/3b_layer20_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b667ba124afc7c39bb9217ef99849a1669595cea39e28e99a20c813abd72b53a +size 92585563 diff --git a/3b_layer20_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer20_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2c395d736b26466cedb19ef39e4f15c5e71e405a --- /dev/null +++ b/3b_layer20_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d0aa594b1d5787bb01a7df41998afd99239022ebfcfe5531b3ea8d80889af99 +size 92585568 diff --git a/3b_layer21_mlp.down_proj_input_reasoning_representation.pth b/3b_layer21_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..308d82ab77664314767365171fd3831b67d2d2a7 --- /dev/null +++ b/3b_layer21_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dc07212125e3a2c57fad8f5f83027f287de844743f947e67892ea99dcf7ce91 +size 246892108 diff --git a/3b_layer21_mlp.up_proj_output_reasoning_representation.pth b/3b_layer21_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..04e616c16655283285918e8047396d5a8337460b --- /dev/null +++ b/3b_layer21_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd11bc0fb0f75c6bab582b92e24459f54024f6ed407e3d6d774375c3d6b03234 +size 246892103 diff --git a/3b_layer21_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer21_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4c27685d6ee3ef00f3d7045d7593dc898b52328b --- /dev/null +++ b/3b_layer21_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa929671e9be034afaebcc093a43b712f9a0a6ebd7715c9dbea7760475919d79 +size 92585563 diff --git a/3b_layer21_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer21_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c6a15ffa2747c2ad5b02fdab385df209c31df0bb --- /dev/null +++ b/3b_layer21_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36f25dcae31c6c828f794f61ac4222f7f566e1f50e64c5a4030b07edee7941e1 +size 92585563 diff --git a/3b_layer21_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer21_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..019825078ecf89fb72d42d49f86f49837d90581a --- /dev/null +++ b/3b_layer21_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a1d5c441a96ba3de5ab5076c9c625002950a62c8b3234c9dd142c4aa9ff2f05 +size 92585563 diff --git a/3b_layer22_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer22_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f26ba8adedb2e5a3da1c7a83f25c16d897acb76 --- /dev/null +++ b/3b_layer22_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e43fa3d75212670d5762b9c3b4de0b8ef98945162a1e2991580193e034f70f31 +size 246892113 diff --git a/3b_layer22_mlp.up_proj_input_reasoning_representation.pth b/3b_layer22_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a02e491208b8efae34797c14d5206e8690a73bdd --- /dev/null +++ b/3b_layer22_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0da7ce23c07755809bf7f20f5b295b7f714ef484e74a2b06e5e1b4980abd0c5b +size 92585474 diff --git a/3b_layer22_mlp.up_proj_output_reasoning_representation.pth b/3b_layer22_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..df4dd03be349f94d9b8ead9b6d7f4fef0bb08152 --- /dev/null +++ b/3b_layer22_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b3d2cdc342045f719b5761924c8cc5780002d4ded36e02f431ce613ce3f04a2 +size 246892103 diff --git a/3b_layer22_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer22_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..022f40c73b62b332076acfcf32cfe2975e36c085 --- /dev/null +++ b/3b_layer22_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39ca834f7dccfe76ca9a06597ef42d927499bcf9acb653af9011a43c24e21af2 +size 92585563 diff --git a/3b_layer22_self_attn.k_proj_output_reasoning_representation.pth b/3b_layer22_self_attn.k_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..64455e7b7919ff273e1e663b1667b18a36117006 --- /dev/null +++ b/3b_layer22_self_attn.k_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cee42b6840f1d28d19984006c0db08897b884848557bf0a9e3646ca4a660dfdd +size 30862944 diff --git a/3b_layer22_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer22_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..9b4eb3278aa5e2dd8c1be83def62332399fcaab4 --- /dev/null +++ b/3b_layer22_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d56c7b0715538fc6bd1fcdbb3855b22e4fb546ba074a5caedaa47558c24d4aa +size 92585568 diff --git a/3b_layer23_mlp.down_proj_input_reasoning_representation.pth b/3b_layer23_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..eb4d65138cb83725f71620ee502f838fe25c699f --- /dev/null +++ b/3b_layer23_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4fb6604e00ec682841cd0722b7e256f7cf08df3c3444e6f17197005e99d0b1 +size 246892108 diff --git a/3b_layer23_mlp.up_proj_output_reasoning_representation.pth b/3b_layer23_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7439144a409182ce450d36f831986aac1d9445e --- /dev/null +++ b/3b_layer23_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d616e3b48edecc432c8b8a9d7890cee4d4429b9fd7cf92f771f115332f2349c5 +size 246892103 diff --git a/3b_layer23_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer23_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..d04ecd6a991a33b52c1240ff9a2578107d52bc8c --- /dev/null +++ b/3b_layer23_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:729fd569d7957b1baf79cb496e37e37d5babe5eb4773d2fd5976651d745ebeba +size 92585568 diff --git a/3b_layer24_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer24_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..060e4285f4f3890e663e815c911357fd8e318394 --- /dev/null +++ b/3b_layer24_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55bafda58bad59b5707b5dd3b36ab774abca50104169cd2b3d83f44538bba09f +size 92585568 diff --git a/3b_layer24_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer24_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..6bfd773b976bfe002ccd2e8af96a088fc2c672a3 --- /dev/null +++ b/3b_layer24_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b6a001f3e189e3f37af5243920eab9670f84e92485b95ecc617e8b7e9c3471 +size 92585568 diff --git a/3b_layer25_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer25_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1d211328cd88783770193a2e6f069019a7be9860 --- /dev/null +++ b/3b_layer25_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4e94d42e9e4cea85cfe02a00c15064fe52ef94471c14d0c79d6d5ae0251c7c +size 246892113 diff --git a/3b_layer25_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer25_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ce6889997034dcc6ca7e06308c04e347263158e5 --- /dev/null +++ b/3b_layer25_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71dba42054441ccf894aac730b70ed4e132650b75443de7b4cc8b91025117041 +size 92585563 diff --git a/3b_layer26_mlp.up_proj_input_reasoning_representation.pth b/3b_layer26_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..31c489bfba2d032035c47558987f647f85035ff3 --- /dev/null +++ b/3b_layer26_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:118f83d98580dc141698d1c02d90b46327cbcdd89c2c1bf8e088d8399edb1e40 +size 92585474 diff --git a/3b_layer27_mlp.down_proj_output_reasoning_representation.pth b/3b_layer27_mlp.down_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a00c476f3ee874faa372a16792b39165d83253af --- /dev/null +++ b/3b_layer27_mlp.down_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0af4cf25b11541799059da8cc1e785d1da4f70d42740df0a084838879aaffe +size 92585553 diff --git a/3b_layer27_self_attn.k_proj_input_reasoning_representation.pth b/3b_layer27_self_attn.k_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..aaa42846ebe583a8321c534bd06e252d9e748d96 --- /dev/null +++ b/3b_layer27_self_attn.k_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9036b739fa2342bc3459a47097e960fd08bc34113daeaa177fa2aa3a5eea3b74 +size 92585563 diff --git a/3b_layer2_mlp.down_proj_input_reasoning_representation.pth b/3b_layer2_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..e533c0a7cf0fa4c918c800d67cc153a3e37beb25 --- /dev/null +++ b/3b_layer2_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cc5877ed6987daad7a4a2d71f2b7f68bb4c8d3b0e32f4d3c8fcb3c984c4754f +size 246892103 diff --git a/3b_layer2_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer2_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..aa68da8661d994c4411473a85f6f53eebcd0909b --- /dev/null +++ b/3b_layer2_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08573c7d27f5c8b42605733e0ac1e282429ae5c335e8eaf34aa5707ffca6297 +size 246892108 diff --git a/3b_layer2_mlp.up_proj_output_reasoning_representation.pth b/3b_layer2_mlp.up_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..95c8f07c79819c585f58597a2958f1644960898d --- /dev/null +++ b/3b_layer2_mlp.up_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17dba986fb3e1a8302c6b87ca685a0b000f742ad40640dfea063afde73c6334b +size 246892034 diff --git a/3b_layer2_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer2_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..43f58ab217c36572bea032d6a9098e73b2d83aae --- /dev/null +++ b/3b_layer2_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01789218dc1b430c7c36f73c1f87fd3eadd74287dde11ea3cd682c263eee3361 +size 92585558 diff --git a/3b_layer2_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer2_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..f7729947ff18e73b30c15083e8a2a4234b5a179c --- /dev/null +++ b/3b_layer2_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68e0986382a34bb49ce5a811bf1b6bfa43c084b2b0c93c7cfb467fbf60f1270d +size 92585563 diff --git a/3b_layer2_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer2_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..2c81852ff150d0451f12a327ea52b8122da1f603 --- /dev/null +++ b/3b_layer2_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9db78fc2d2b2e358f3ecec40d5c2501f7204a8f497be19bf477b2158a206321f +size 92585558 diff --git a/3b_layer3_mlp.down_proj_input_reasoning_representation.pth b/3b_layer3_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ed83323cbae2ae939dc2ad8fef42442916446773 --- /dev/null +++ b/3b_layer3_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63c104ca08413c978c5017a8b1378b394f06955390d61394966466fc022761be +size 246892103 diff --git a/3b_layer3_mlp.up_proj_input_reasoning_representation.pth b/3b_layer3_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..8bfaebd6aefd99176a0046c77a61cc65460e5a4c --- /dev/null +++ b/3b_layer3_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e32690b43c7602828f29d00bf2889074a0f5c5d479187644735d154483740976 +size 92585469 diff --git a/3b_layer3_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer3_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..58c93411ffb096821fbdfbd139b8ae8097b4270e --- /dev/null +++ b/3b_layer3_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:617eb269d1c1aa12e74bf343653ccefdb0f94f0c4cd4df903b900a96e5625cc5 +size 92585563 diff --git a/3b_layer4_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer4_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c440d225dcaa35d3b3ce565da53a7e8e1adcaa03 --- /dev/null +++ b/3b_layer4_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca93c125daf4a81f59b8a34f75451cc480681dd316893a6214a230aa59760a03 +size 92585543 diff --git a/3b_layer5_mlp.up_proj_input_reasoning_representation.pth b/3b_layer5_mlp.up_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..aea67b19806e9f3e3fe43942523fcc162d0f2501 --- /dev/null +++ b/3b_layer5_mlp.up_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a08cf2f4e97e6d3678e8d0f0c4c6b9406e8c7ff49410236c91a60a89e2c30fe +size 92585469 diff --git a/3b_layer5_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer5_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a3994a040bd057da5d9f7f24330537281957aa0f --- /dev/null +++ b/3b_layer5_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ab4b8ffe347cb7f5e884d50e11937df95a6cfcbf9839e70499dcf28477f222c +size 92585558 diff --git a/3b_layer6_mlp.down_proj_input_reasoning_representation.pth b/3b_layer6_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..a882f3d973bba484d38cc7837de31474def6574c --- /dev/null +++ b/3b_layer6_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b65dc9a7931ab3aa293050710c89e50d43227eeb6636448baf73135c86d30175 +size 246892103 diff --git a/3b_layer6_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer6_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..af69d2c039635186fb68c38432308246864e1ae4 --- /dev/null +++ b/3b_layer6_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56e7377fdb7bd5e31c4ef962f967a7b5b24ec1e396696a238b7e221c03407b5 +size 246892108 diff --git a/3b_layer6_self_attn.o_proj_input_reasoning_representation.pth b/3b_layer6_self_attn.o_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..4e3749074f76265fffedc7d8c5cf7c0e37726157 --- /dev/null +++ b/3b_layer6_self_attn.o_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a28a8ef010d883b3de3ee048521aed3ecb074f2da5a3da535090c4326da759d7 +size 92585558 diff --git a/3b_layer7_mlp.down_proj_input_reasoning_representation.pth b/3b_layer7_mlp.down_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..482e48eb761fc1b258023f18eb633fa2afca9eb7 --- /dev/null +++ b/3b_layer7_mlp.down_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e32af352328c93a082e957599be17f369981dd4c640d71765106699efc632fc2 +size 246892103 diff --git a/3b_layer7_mlp.gate_proj_output_reasoning_representation.pth b/3b_layer7_mlp.gate_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..c492a39c0af4e6448a5c8a9533782d2e4ef32bf5 --- /dev/null +++ b/3b_layer7_mlp.gate_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a6c79c24aba6514603e63e3081278b1bb7dc5b28ccea6b4cbfdb23c87ff0032 +size 246892108 diff --git a/3b_layer7_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer7_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ed630076979f6413eefc698f0053d42d25fedb85 --- /dev/null +++ b/3b_layer7_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:911e2aead1f9e7882f96a51791b8fe4c5c1c6e9fd6fa8bb89aaa14335a829353 +size 92585563 diff --git a/3b_layer8_mlp.gate_proj_input_reasoning_representation.pth b/3b_layer8_mlp.gate_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ad9abd3cfba062afcd68b08408e51aaa8c76593 --- /dev/null +++ b/3b_layer8_mlp.gate_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b96767d13d284b214183f4e6b6a882c29818d61a7ab7af02f85e2f7047ab1f1 +size 92585543 diff --git a/3b_layer8_self_attn.o_proj_output_reasoning_representation.pth b/3b_layer8_self_attn.o_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..7cdc5520f5e3008b051cf49280e9e18e6fd3fb51 --- /dev/null +++ b/3b_layer8_self_attn.o_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:075d3ef0bfc825cd31fa64ccaae203ab5b2968df878e81d708692a300b14a202 +size 92585563 diff --git a/3b_layer8_self_attn.q_proj_input_reasoning_representation.pth b/3b_layer8_self_attn.q_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..5a69793339c7da42047b45e881aea39c509a5121 --- /dev/null +++ b/3b_layer8_self_attn.q_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44e96e4be945a978e92c2b6f38d34d82e0c364a4091fb417ca9e3a34a639f5b5 +size 92585558 diff --git a/3b_layer8_self_attn.v_proj_input_reasoning_representation.pth b/3b_layer8_self_attn.v_proj_input_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..bbb6a426105f01f46c0b2c90db1e7160ec567b1a --- /dev/null +++ b/3b_layer8_self_attn.v_proj_input_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f29e3c8794661e71b682691c71326d2944faef5c0ccfba1524b5e0ef7a83b75 +size 92585558 diff --git a/3b_layer9_self_attn.q_proj_output_reasoning_representation.pth b/3b_layer9_self_attn.q_proj_output_reasoning_representation.pth new file mode 100644 index 0000000000000000000000000000000000000000..ecb5737c0c0b52c2546d5e2cb8c3a0a61e66ced3 --- /dev/null +++ b/3b_layer9_self_attn.q_proj_output_reasoning_representation.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab0a623511c4742ff0bcf2183773e4c790e1a9c2e2eac38498a5faeea985c198 +size 92585563