diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4124b64808c9f85f106c4500e15a03c01d73016a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a58c7c50550bbcbef753f2dec7486d71d4ea58ed18ad32d97eff5c944a960b62 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a408adc9e06fcb529f853e412b7fea2431c91e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d232e675bda3ddd8c5d8bafefac1e65178ff2e5af26755829e33297d2adc7ae6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c9c60eb6508bfc571dd2e3eafe9d0db7259faa4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69486bb25e3dd8434c82fe5a3ead2a1dfa67226c04b4797331968313d8cd4878 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..575bb11486f1c00676d05bbd50fa32675d9d47be --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f02cb9db3156216e4912d60814a0b2db492fb39b4acb1173aba7b61d133b198d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..119c9a6a1bfc9ed4cfa050f04e0169eb363d3a0a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2bf92f4c6b67166d177e27c40d48d9e7ef69a8c71ad082b1a1ed3447dc827a6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba8fea49cea90994968deff144ce780b6ca1e30 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0385b8642b30f8e638fe9e7f2a4447adb55d6304fbee6ecf95067fa196445d8b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2d3a0bd6b38a6b42369ec8db5bc81337097d226 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4151e0bdc3f4e97b02c7acfa1bed718e1c5b73a5d2fe77780d060a9e972da57 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f752f11f613c5b803e39586fe21a8a7fc1224c54 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7b5446fd9d16659564bd3bb22452aabc24b2858c7d695a80aa83811015b17ae +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..211ee567ebdd561eceaafa652e5334c9eaa25997 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1c69fec9abffebbe63669f483bb7e352d89580a747e8bb7a7ce3387c6b3d7ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c206b367c7caaaf1eaedbcaae55c90efe176185 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49b581eb4598a3dedcd4f309e6f97be760a9abf6cbc65a30594b5eb3237ec0a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e24571f46588a73c50e0051ddc2490a15b48e933 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ae5a1dc1ede0aa1517d26db577c1895ba7a8bb18a157a62fd7f9c1f6c51b7a2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c5d46112824a14f88d5328390d7f995d3cdd06e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:575b0b12f1517fdc762fee31aafe7d393bed48f0a1bb646828dfb02edb4ac1d0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfad3cd524cff7c873fdf660367c8001957bd762 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e0505969d4966e9611786fde584cbdc7dd59cc66441b5932404012a9ebcbbd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f740714b371ea33b7c42b18ce7723db452078e0c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b298f0d68217f0e03f3ed37d9d5e60601dcf88ba99f3a2a3c462a3b2cbe0d0d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3154d41297b1c8a7e099a38a26d97f320be2ddc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57f0bd4a423f120f1ec9ee9cd40cefb11abe7d3a2200971af554ffc2f7bc99c2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7648e81b88e08a2376bc75c6520e2600b1268b33 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44ed2d0287536f39ce90281c4861f46ad4e153ed3de343cc3f430e0a3dd0ff46 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec610f5f9d41dacc131c147ac259bfeb116cef36 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a022bd973a6042181cbfef35d3e3b713d80fe4d19711a1bc7cab1348ad4f4bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c3976c85a78b16cc08bab7e46c5108ff399eb03 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9552f811f1c2a7bcebeb1d30a31143ff5d1d9e58bb6e06e71dfe4bd01c4c72ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c7ecb1086764401a6f7888bed3b1c3ef46e7d7b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfcf9b0700b96650e357f83564dde5be8ba8969c15bb3c577ad1a6ceddb72cc4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61a7d6c4d14baa41d5d8ade244734acf7d5d0828 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35a4b11a0718c856eaebfa8cdd2b04ca1b76c9cd9838921153ba12ee4834ee0c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fb942d0b6f9a1e08fbac961a104205b8595d9ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c78902d579a58e4800c77fe1c53f99ffb98075f95292f8198f10876c6c9325 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6d4faf3e66aab96293e0c94dae03ab716042a90 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aaad18b633fccecd57fc156095a198c1a36766549bbf4141e7cd0775202a8c1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..373a1e4d5d7dd596fed5a2b3dd8c9540a3dca14b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18357a2d9ecb3b6c57149d06b3cd192974fc693303259949e8c1a01a721a8cd7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2bbd564f204ee66b0f7753e05284b265d2b4214 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:877385f0e2dab00cfd859a6c05183b4b9e4f2f00d995d241bc4e30e7fddc6490 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a945d97e81d4127560469d9c225339397160c5b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175b365928e6564f1cdf29d8ce8c175c10ac91e9dee9fa774a59657a2e91323f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6963de35ff8011bc18ec4ad2cec375a44d5a652 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45eddbfceb56bddec82321ff208a59907401ec142f3ba8c8fefa46b151ca17bb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a630808621635fe769b655a7b2c15d3655baa9e4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ad60cd6d7955bd6af7e35df282c51f5792c94e834c6e155651f9e5668011897 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25b86bc9223fc659db11217cadbdf84ada194797 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cac6af614e13e83fdc766002b4feec99feee658a6f0ff83f05c423bc20cd163 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee5c27648b6c0e6fa49a6c5495a9d87fa351e9e0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eacb144c6df95d6af84f41da62bd7e65220aa00f2b5b3724896c564b752d4218 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb0196852449cc2a45943266b4158c96cc029e63 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0e6a9e6b4554fd2756d2eaf51ef651eaa6976305cdca95f241a4d481c6364ed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..858def3069a8a2ccf6269dde7b4e9fd6bdd17025 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a00f75cb96201562f76bfb99003bf21b1a16587198ad666d4914151c6edf4b29 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dd6f43d6c0dd7aa231e1fab5b3ff3b60e4fe051 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7581c281890ec1991f27e86fdae8b60face680d2ca879625f46f350510c50601 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed2ba6f107c769c375e70ed00bdf8f419be6144d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ddc203209a1da1f07a55228de9f486563ade04d128a739825518ac8e8383a08 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c17103579d9b83deba7be9cd824429a3a4e7382 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94e022ddc4be78544d60954e31e0f76462616ed940fa4a05963a5b54915c7f33 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd1be310f0664b814e73ed1d1e23f219d1d46a64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fb048cf2e5bd726a75c3a8219fa6bb4207a0651fea719e8a036338ae087914 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a76ba358f59b7bfdc4f943f5b7c399df871273a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fbdc9856a26e2278b5069cdccff6a5622fd6c2005cac9c6f38a4b074fcafd7a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7ed3a0258aa3831df6c1312faf815d3a3d7623e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc65429b9092c63a0e580680e31cc6a2c4306adb5a57f70d53886c148830da74 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ab6302da0c4525980ad873e90f6c38bc6488cc4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a77c4a16f50b23920597c2862034ad95624baa7b0ddb99e647bb3b65616a4d4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..785374f93f448688dea7c775ecdb14c2ae3617ac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29aa4d7f24553dede1f482b931213dcf07b1b9e8accb495af7df554753bf981a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee4d56caea4e868c0b1f47e8aa1d336bc9e2c3b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:638519e41e4d64d7a94509706df8181f961786838c155e01f4dd43d30395af47 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0da71ef77fe80f91408db51f486f84594fb8794b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf7b1376c037b2a4cb1ff5d0b617bc640798193a41696d2110811ce153366d3e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3069231143f01795e5a285a5d349bd3c56837963 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d52d1a05b4a335f58c497ce0d0b57e8e3238e9b39fb32a75dc5d9e3530fa3b5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee3bcfdbd3281999da9a059cd1030ab8e9fe5ac8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b9cf0ac99e81a27e8341387f14ee7804b39bcedeb1368cec248c7aaf6de85a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dec596476bc88c2646e46ed040471b2eb2338d4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:279ef05c0efbbe8ab85ac1eb3f627bae2fd8cb35dbf88cbb9090934a27b01bec +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dee515354c6e56617fa9c0fb938b99d1cd77a570 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd932ac94dbbd461fa57928745fd7510d62d29c3e9e41a1d89cb026fed4a9a2d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95742c57709291562dd91b70a3817061ae422e47 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:602a343dd3a11a8e98915139d6c186a32e7e88901ca5a1ce708d74b357649f82 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..740fe3f2b29eb3053ec3e378f3cda419bcebce36 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7538d4ae00005fa0f0feb586765c6918b2370d51fdef4b94a323d0fd1ed9c5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1de93719f1d7ae717ed9862b0de2c665e03fa27 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:660071867059ebdb2c3fc8a488f281857aa10d475e70328cd75c8692c892db14 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b53885ca3c4c343024286fe0cf793637eed45d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f455b4ba01975aeed7199d23d88c0a2169aecc60f3f525b6c4a2db57d746092 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..555149fba2eb885bb958a1917cc590babdbb207a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a26da039a4dd93afc02024369a164fb7003e35fc88b67a441f341e3d274d444 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5511fda05ac00132d9c32b873fdcb94abd6bc1a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08bb227472dafbfe70ad6f75a6810f9e9223f86589904f664c65e4e83a20c017 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25b94f5f93d2564a8a0ccd9c6541b34beb731415 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:129d422832c27a4b5022f57945d772e13d481f98dbd4c845079a59fcffea5c39 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..380107e73003dc48490806fefdd9ec7004788b61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:599d22cc569939b27ff2db3fa9fab20b7ae8d53b8d05a465dc0e5ceb75826ba9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0365df005a3ecd0909d32c45ff9231c1ab8a2d12 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d3d7e4884950dbc3b89ad7311cd9a629bd3f9cdf9aefd84d7a0407e4a44ef4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb13b21059537eb81d1f577b025879301910a9a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:473906b9fc5ff1ce248f99163213c36a218d436c95d82426cc14ba0f9c886324 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d18d0105f966c399474c91ca7014d8451972f029 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b04c6ab0a515c68a1923dacf43dff26318b196fd452f9d7582ee3822d1863911 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f9d0d76a584a0f0a9a9cf941fad155a90c33906 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44fe06bb6479a912f360b912a5773df828607899fdc4ae7fdc2856e4a999184f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40469779a67cae728f57767be6ff958ff7258329 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:106499040161081389288ab42c9101ae693328d0bb53d41432ba1b21c238dc01 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2692c9e73d392d1019e4e5825fc6958cc5db918d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d0d18cff874ccc0d8b65971e281c9398b7fb44cf93c0dd60310354c601f25f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc65c53f5536392efc7763e174b0b97e3e9b73c0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0962a7661d4ce65885bfbee2fcd23f273bd386894578f193e8c9c2c6baf01c6e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6024b1e5653e9ba7612ca9ddcb2ca215e68665e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b72d537f39f3a2eb8c3a2b33de93c70de408b83403fc88d83cec389fdb4182 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51ffed4cdb8c0e4b4b001c08168a14e3fa62d60d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b23f0c605b2983e0b07680a3bd48f0f608b37f0479f1dcf8f551f78220fe0eb7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..126dfdbd09b0bb5d08aaee9dd061fe9a2fef07ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:417f624cfd8242967c980870364991bab8185737d8c421a86406a4eb56a3674c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fffb10057fde272e4d8ce0a1b3fdfdaa780e3d63 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea4a61993a781d1efe398a8dd3f6e62d58f0f5ed91d00e237cba4f29323bd04b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f6d63c2255596e2cca6455e9910ab684a09507e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db7de2006c2f72ad31e07596e35e91da5c397e7d57233d7eb5ad86ae0240cd88 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dbdc1313a9b123d2fa36681f8548873f3857970 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a24d0a8c49158f6bd880ca996e2d44140b6ce3aa6f92f4fd59503d5ccec6fd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcb143260811255f2a3a1feae0284c8528367256 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f5f7c0caeef52d08fe4f9c7c313104ea1dcca3ac78f3121b522de6d207c918d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cad3c80bcd8e9ea221be3456f5d654b4ce93d53a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ff48f1f7e9e0fbfa5b9cdde412bab44ee1912bec8ad4a9245d41febf662d88f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a731ad88b319ce1c48c3adbd63e4bfabede20f38 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:559b34a80b6233e88bd4fb0adfd30c597f32c99ec3c48c69a7b8242699f88c01 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d56b9b240fb2d6e1327f3ab652a5d10f07c05475 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7cd07321be65c7b74f8ebbb5661f670c04b0669d248322a5c5827f55b83e354 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..933bcc9676966a457a7aeeb16a85eb4d9164aed8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a07c97983a941c54282045de98fd2686fc1a0c6ff22154a24fbe357944c10c48 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c235446d2ea85385fdb5fec50f514f1419aab9f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e66bea85892ff4f606dad11c0a4bec92843d3599652c71a9098ba40732e4b48 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..affe76c912f69be671bced5b5ae369a2e45f4015 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71fd0626380f034a133fdd4076159f1c5b9d6b070218efbe7fd231f6635c853d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dda60990138eb03bb3257cda7716f9191fd1efd8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51efe663f1f9f35e37ac657a944fa3fc33bc97cd3bbfa532e171101f7b690e78 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce702450a9206d1d009b8f33e63ab990d9a5572b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aabc3d6e9966a5c234f5c32a7ca8c4cfb58196c65cfbad4095bc4b029f05d31f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce8773e0d21e6e0c22611894cbfb8bafc6162bf5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c2236491d112c3f0e89adf08841d5c5b1343976d3b2a2a531da81506d64cd76 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3e6403806ae96b0439debd11c5e73a538cbe5bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e175691dd7d18f3eda470e9dbf9547342bc8afca66091ee5663ab20dbf1736e2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8df22407b8f25785326355d54fdf998c6101259e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5da5f44c85d821485a382a327f3924dabff016bf4f353fa180e7d9fed3c05dff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..505dfb29438d72533eba6be1094b19000fa4d2e2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a75282998c002a79f7db950510211219648c40a3fbfec4070a2ccdf387f6bdc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81ee53a9874c4306b9853e1ee6c5252d357b8c8c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d1efe12ad25bdcb235e458bb8a1447cad7566ea7e8be5172c3cb5e91901f5e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d62e6430049e08be1067f68b131aee21a58c00e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1925748853cf68679da71c1d1bc6a19c317b292138441308fdaec0606bcee11d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c918546dc78d33c6628d41b23be94e9afec748a9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b03a29a325fdd9a09aeaa6b30ac36180da9126aef0325d1dab6a8ac518a3b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55cd74350f3fbf8280a0c135ee6368c31f104614 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48822ee6e2f2f2639dea0d6ff4de65b6b14e07a36c99c671b34d210a5cbf6532 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93a7b5d52cbecc0672e7f0a94c5f25ed180d9428 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62d4be41532f7dfe0ce5498bab31c87ba40d1c98cd5a7afa8cb0ed63b9e474f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cc92a66124f27064b68b524f4ab918dc5ba09f0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ff9fd4e27b51b3483479e208b055f7a15978f97e42eef17b5f9a5ec3602c3e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffb57f307702662766dc247dd8b968dc5d567521 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:084cf4da4700d00eda05f1e9da5d7255a5b49a0c575450da2fcd93010c3e5727 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b6e574a6610cb01819f7f8412c0f6149c725a49 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783365fe6783f793a7ed436e34cb69001c0b767113bf5db19786c0143dd14787 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93b925bb98499ffec5a7628695f2e0cdc99f12a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486e0e5ddfb6afeb7376ecd6f2f3bbe8d77bafb3061087c7067ae7c8ebfd75ce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaf2e44a0169a0096ebc6a0b953af4f89cd7ac56 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1119b9f58c33a39233a3cb162b1690014829cbf8c0ae2358b8f78e255cecc64a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3758a56a20f2b75e24548cff21e4e9ad589be74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904d2307ea3f7f81c3c9bac6019446b0395190119aee142301c974558a825251 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef5d921d3635374e8d1302a8677d5ac6e6ed52c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b8f5f4fca5900b66e6db51ace7e6149bb661df3a716f2120904fbe9fcd6ff7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e25f5986eba51a369617b2cf256d71e0371ba634 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8307ca9f5e394f5a0dcf3fd723b59e83ca1999baaee653002f614699fab6600 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41e2f9aafdb5226d0fe4778b1efebec7eeb4922f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f27d51b8894f1bc15058cb9a34b6ce37b07c382581f5aeb58c1d5f4a80fc646 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0c1fafa41ff3d00474bd880cdac365e14655fef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeddea9c6653e3e76ce668b16bf53125ac1c44d931eb4b0046bdddb3c7de2f2e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a782edc62ce430a4569203070dff4c3d42900c1b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:084b68a678a5c2b5437789b26a5cdc457fe9f2743dd3af7e36a4dcfbf65122d3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a069a271e2db63b5f95413c57233a44f93d40ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37e5a0cabc5200ee9e9a60c5aa0cd2ea7cae385ec2d12f42b8798916bdc583df +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8bd3e8b0086ceb20bf9f00551d6c231210fbf6d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a5390e133a4ba7ff43451787181955566cb9fc00cf96929de56a1f32d65778 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..344b361486b94db4207a3faf4e53c1589f84a638 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08d0cc65ad3827c314e20bdfca59c44f1cebe74cd4f64af2304b496e0df12430 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f54ae860e3a227ccd7fc523065021843b839f8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1838d8afad87bd9e6e0fd7f4672a44605defa311055f51114d15f5964db4e44a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6eaf1c86a6c3322084f92450d990a12605b8176 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f83f2b0457b7cdbdd30c403de0085f4e679466c8f9ddd876c5d1a2c9048f60ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b94f2d5d4c2b1f50d5f8e71a0fc11808ff161e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e767a8854a01f06923244f6883d9f29ef24b21c56c5bcb169ae2454d179bd063 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d67aa504138e5d5ea8582124fef6e80116758835 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:314482c7e66893ec41ea86f7db869e7950baad8f5f31110ecca3c154a44afcb3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2390c61e683a4aff3ac114d12ef044a9169e9610 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdd64e373f853c3baeaa2324e0bca759ba44c21afaee24058bcc990c8151f35c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e16434b9d6e839c2c59ea4490410927eec353dad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7925a80acb62ac038e94d62df18786486947d63e065ae8b0edb3619a40c23e82 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..001133c283e477be9396029beeabdb3e8c63759d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2769f8933b8b0513e17b28fbaa1fa6774e1750095635f87e25748ae057625ce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0efc6d153d953b1bd2dfc323f0c85d2bb99abeff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf08517a8070461be1d462fd81d07c8497ef3a57a628db0a9ff07e1534b6fa0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb260a63e208e7b4068758a7ad495aa05adafe6b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbcc20bf631f1d9e5ac0d7a3ac32726317b477aa1678478e2756c368bdb27817 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15962fd141036828dc9a5ef88a993c6df0f01a3a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36df4b4bf0d8371c257b00b09301122a6161de1e2cf839028b43f4c1a9a09cbd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ce577c75435dff543e3bfa43621ad354738348c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:211b1e7b09c4e0b2226d2402969cad928068a845dfda96acb18503c3d6a2946f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a46194bdd4938f082e7bce1ebdc417e0eb74cf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce71d734cb983cbdbae66d304f50d97055894aa38179d0466e49ce2f6aabb2a1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..342588cb0fe6fe0a6dfbbd5f5c642f73f68b7f6d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb0d076c4bad33700bb48d753a359256328b81cdc658f8f77cff095a5d0f87c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a21aaacf7c444f05ff850240b1fd67a47d9ac1ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9570745c9a4d573d6f05fc8c2a3633af7ede5717dfda3867b3880aebd769aff2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc2ee8da858d9b155ad10a9f0c22f17a4a0aa643 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f043ac7de985a0e17b5c1f69c44b1d2014ea1598e3cf899c468c52e371adc52 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49bc908176d722956e10ad0fb603d4735289e9bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92f32e1b83a66b697b5e36d4d7ac01cc58145b58798a8f76ff1407e9f0218fac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fa3a10882c2cfb7058b8601a6ef9682abc76983 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33f1a3072cca7aea449143a164dedf3807b6fba6255651df1a5b9ecb71e003ae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48f5107b3abb1709f87c86183f2d1b157f8aa57d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:879f619bbce70b473edea4fdb8e25dff281c9b153c9d7e30311696d31ac9d2da +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfa645fcf18a6ad1cdd669c22c7d7a226a1ded57 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16f3b22f433458542162a601f1d65883b9d6558b48df1963d55a45d44697827a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8905d45485374b294a8fb7107e0b0b5bd0d03c3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2eab6d781670a7a24da2aa579180932bccb1357c9c818db6734006e5d55a4e0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..525012e7e34715e0daa6b5cb926f9b11a6cf738a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43092d96005dd40aece5f608531de09e8fc7b31052dd1e44541dc5eee54a8f39 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f91999a52b5d01f7f4686906ac4daa5ad2cca93 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ab023f0e3574586e8eb5867adbcab0f5853daf0944e05ce8baf237ba6a339c4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87d1360d8ba517c07d46a905ba733be6d8565fb4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45df4748571c666d06eb045516c3d936689c351356349fafcf09dd9871aa0cce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fabb3b1332d85ec784fd78d4e5a507857257349c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79b540204b6ddf00bec7885785389d532bb707d577a4ecfcfe5996bf1684ca83 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..202935cbd25b3236827232061861db3a8630a455 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1e2acaa44135a760a832d3329791a576d1ca7953bdc4331aaf84420a860c290 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a71902afebe9a8c367cfe503ffd9a158e855e06 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b55433740d7ab1b66337222ef2feb5b7fcbdf95e9de534e2a5aa06a0199d4ee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f7927d495e45f6fbadad79fcc8901c9768a8758 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c62f2921881fb4f91de43a5f6db93d0aa41215fb1cfff90ad06390d665f88ca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..354a4720d328bedbcd49f7e27ce0a377cbad0a65 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a657d5cd81ff0458ce011c6567b2988060102441048122d9b7efaca1dc049060 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52c933ae718991b9ad69908ef86cf4f28dc97c03 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee636af60aaaf3a5fc20d4021bfc9ba45ddac54e00f14a6570f90e12aec65e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a99226590f05398db3130516edf4cdf258ca65e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85788f7f234dcd93a6ee347d86aa74f640e7cdefe58b86a33f982b3d6759daaa +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..692588897382ca56cc4204b8a137f967cf425ca8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96d7586cc9a42bc8f34c724ccbba478e88546d771d3b2ea3d3317d2472ba71d8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4892b3f874f054a4ed6fb0a350d449e226d3651f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa7ce3ff6a5f3cd3547c9c06888d068a8b860a8e23ed5d06ebdf1995d40ad4fe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5858288c3de482a4ad3d1621ce2ab082ba3a1c64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d3359b933b0340823b71729cf14ae7b8e060211c772451cc13c91634219ab3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2f5ffd61dd8a23b40a7c785e7c8adeadbb93d13 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17432a394e4df2d97f433fdeadd9c34858a8aa10528e5b4674a11bc2157fca36 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bc93c7b02d0a29cb5fd90021f08499f2c75f9c3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbc48ffe1cb3630a1138075d99a7cdd21340f6384aea0bcbc2ce199f719c43fd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5306e89eca574b7c50cb96a6fee9af1ee5a9498 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7bbab34f4fe92d084332af0aa65f52cd0f3f9adf75c1695aca0a9cfc8707b15 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94f6408092b23d09271884dff3453ab3c8b08415 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a54736052e5ae6ce198cbd30fcfd4172793b5f707ee5610a8f9cd47a033ffca7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fcfde68a740e61273aed26863271d63ca5a36e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50e7c9f1d87517e588285fbb2d21bfc7c94b5ca05abab8a35e39a69269393e04 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ae987e6903fa4af526fd0411fc8a422f741dda2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0cfe422247840f850fdad40e541630cc72d2e73c52d239ca9f4fad99cfa83d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38be643124d4eab48977d15c26b98a73253c9704 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:203c9da3e2eeca586b3cf7486bbfac5949ae9d31d49c386ff41f9975581b62ee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f06f07c91cc034cad6c0c388b2fb3cd3c5fe129 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aca35324d4f2e62ee899be14912f75c983cfca65607e720c90b58852895e4a2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1bde9ca6e95815d3bf5aea6e66c49c09b8d710b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:384785f61923430dd77cfc72a1a8cddb6b3876fe2fd74f31dd60079f2007a081 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d1c74f7fe6337960204709fd96f234f06b1a0af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4936d112cb80f248f1cbc4affb79c30c73828cc1f73f3355d804be78f640ccb7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d454ba19246f7584401af69b201acedb96e2bd26 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a820fda9a20845880abcb5095c2c2ea5f36573ba34d0bd2a156f115e0beff329 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..749bf775cfc8af94c882cc5a8db73fe76c703e6f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:729b743d973742ff310040b82a34aecf5aede75f3c80cbfb188bb8cc2d0a778d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..877e4e76d6c88ce58f32dbeb18a854c1342cb6d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b35233c896422307387ce906829d78c65cda13b3dfeafe0440432485f431417 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..405b2d551340251d4cdc256bdcde4864c9346dae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e1e62de728d9e1e987be68792b70211ea340e3c030c40b739e34fc5a419764d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f9e3a62dd3892373fdf0210e7fce73e31f31fe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e637f239c71d73cdff1ba0d13799c7a8557b53d011f30fe63da6fbecb758a20 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebd93f85f90c41e3ea4ca07a6cbe40edd027b2aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c1affa4046c82886bf892b58fba3c6eb216f10d4ae3e3539bebba36db2d1d1e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04b33b74e3e6ac9228d72162b28813461a2c57ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:137b6044ae962591fcbc7c624b14123cbf37efdb3a83f82cd6d428289645c233 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a045b8c5acc240aa24574768b9ec01377329a5cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc0e750cb737532e55fa7c5a3f31912f3eb068340050acb31d2c5b5c7208de23 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da861ecb8c1c4eb02157e501824b0794c9cfa6aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfd7f8395ffd6ec21cd5d1b2f0b392080548869a8b27e97a3376f0a557b44435 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bb277135475081226f18b9f96b7569e895fbfda --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84beebecd0df3eaed117d26b785f793ab603509b8a77c6ad036c53f38c77f7a2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e83da53c7e79dec6c9083c0823eef30a28efee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:413bcfa97b251d19e8ec094294000f01d943cb2d1b71b54c16ae83aa621ca053 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a30f4452a79cebac4e128844fbbbd616d404eedd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80dd9e87ddd7e58d78860e95b6fab9ccd40b4e0fb4872ec4eb4c1b780d299cc6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53bad98fc55f4aea4de5925d8d19e6ffe0af58c9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:210134d7ae34ef3248b9482a692f2a7f9dffdedf1ca0e815eed241d6663d8c8d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..292eea7ab9e981fc7ca50191d9a9bd75cb4105a9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0f1da388e8eaab0490c58c6de4de002f0e30839647dec5ffaf5a549af4b6e34 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f7c05e05e14f352154eabd4cd2bbe89cca3c72b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d880044f372a2b1ba503ba4097fb6b92284077a30f134317abb28ee99bacdc9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54780e35acdeb42f4fee9d59533a42c02d831215 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba9da837820ff09a0fdbfe81d3591a2da889b993cbbabff6ea722e472e14a92d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86d87d5caf33c0aed3811791c1b6eb8efdb52639 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e60955602e9f779c4beb315cda374ebc381b7bc94bcc0c005cf3cd1d964663ee +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..596800988384ba9568a26ae9a63e5ee02af582f7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9c48d9835760c56dc2ad12cc446f050b9513450a0cf4b62b990c45239cbbcbb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cdd61348c66a04dbb68fe7c3fbeb98ab78392e2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea12e9fdac03f673d18d223de2c90e3c9038493a153efad00e3a5a4b50b53a54 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c403c9542d94c0b42ad301b6b6cead6ba21740ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee54d27599f5ac55ae100649501fc04735e180423098064fabd0d5ea252baaa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8db553d45ed1d03a3bf4c1eed446688a810d354e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:547acd847b527e81b060008787697204093d2083ef98594e1870dbf7a41126b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..177cad66e729cb142bca150323d732bcea84a32e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0f2f36967ec29189cfa8e859da9ca25d15370f9f98fcac6b67c9c7e4d692f0f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f15eb367bee750200bc097c76f1b1db1d5e5d94d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f0de410221d07360301cf392a3059e178a7039ced45732119edab756ccbdc47 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9967e2df34935e0e0ec3f6f95f3d0dd13b76cfdc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a84458b7df5b5502fc8d8e1c4195f7175e2115eac39aff5e85f7685dc14e0ff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..451e6e669b9e1cd0e55ad2daf65cd09a2c8c4770 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1879e1832427c96f4d17815ed2b5617f561a99121762719739f863748520561 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47c91f20dcf9fac71187ce8fd700e3c5404309e1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f77d60c490cf97792c025f20ab7ab3c1e6a6dd4bc9f0d08dce87302845983642 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d22a16d6fe22ac6d40fa958c7316cab100cd1ca3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a0c7a8ceeced8f08f932b942717686d51a0bbfa9e140fe01203c1b74bb3a755 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5263074c675a96b812dc4cc8959f1ca66f3553ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:009a9deef42ede6a47b59049fb93ea3744ab2a876ae09cb67c7d9199a72fa4f0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6effe5b51e6ddf557f6cf0fd29f69eb269ef2228 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a5b7b48e728228e9bdd587539704343caf0c8f7bf7d5d90846128fc0b34883c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b00466e16a2b2563b59cf6fdd8008183f8764e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f397169dd921ec804078133fad41dc0442581cb5ce3a2c464c6d7521e7e60b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b81a262ae7d87fe0668bb25bb0ac19181bf3c307 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941ad124270e4cf8c55bebb0b2548c5ff9ef7dc6370bd97607153d6b01184458 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7497e0807971844d984d594640fe1c37330f50e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2913306777b97826e85c6610ba2a58be78fcf04c005b89e9d52905e87898b225 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8b9758b96e98f416085ac80cbbdafa97b491084 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18825fb8f01eac50708595a01997a73a681af92ac0ee76c6c4424adca05f7b75 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa4ee887ceca32f719d53b5d7fbb36f16bea2b07 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b341bf4f92c80a4657fd23aec4b4f24db1a3166ed48352319b9535509f3b5260 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bdc82bb7e15bf14686e830621602554b1c8de31 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8611e5d3c6238abd5fd96a0b0b7cbe6035589391fed968a5e128a6fa8be7387 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..162688b05bc74d202221cdef1ddb56ccb05a72fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1faff95e13daef5d223c1883350364da2a6f3ae8999c0aacfe6331bce6e4cd3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f634f3a2e04234137d9c2e8d65eb33b945b883f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e368ef83155eecfca8f3afb88c03951b72307e13a053e459814c92c9560c0e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da7b194bd01c2fc48b9734a3ef07e4b90dd13443 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9122fcb9c4bd62598d33ca8a9b7038e2b5542706135ed8c70125d504810845 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3eea84682fea2bc9ea26dcc248a2cbee982d372 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d75d3fee176e0b39ad29b22a12a9bf2b4413e0dca25833bb7ed82f28f37720d8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..594e09cc0b18a5dbb1a2768519c94c1d5f88276e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95fca8bef03ecf8ad7dfd98065e62cafc6a286f07bc50744720e5ecd851d4329 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e09e4b34bbd9cc55d0f06233401c819c947a96f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74cdf85c536d66a064d946ea6632cba188ea65afffa1c1a0999fecac73ab6ac1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73184f3387ad722715d4328f8946997b9f1067df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7621846955a0bc7dce91cbbd51b4cb3ddbf05d389dc7a943a1d08ac6c3a708c3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4505aa69e84513b58d0c9354df90898d615cfbb6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a65538a823f6f0374c65c474761455098f6d2458d0c0da9d97f789a35e43df7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..414d1a56ff2c158d5051a32813571ad674e1d220 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb6f1cba64c0fa7f2c7ce7bd2bd0003f4e2ecea32596c992dd8c17914f542fa4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c397d4a7d150fffdeb5d9964b02ae9e16b8502fb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9c8b6d02a0ebe5fd120ea1167374cbb5bbcb4f02d25a466c0300bbfde339c1d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e53e07290448ded08a7a9de44810a59bf909b5e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26eff01232b0efb0cad2dabee2ba0dbcfc2e92ad80035dc74ca9e6f8b581422e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f636755cd5e1c338f73c933c52603d06eee7d56a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1228d94159604df5f8260c9f1f04203585b80959c78dd9e28eec834f474e03ca +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1068afecc8eff8e7b8ca84764228603bc8993df2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e7bb024caaf3f59506bb29f571897254378e9271868a2e7e735dfa3457b78b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dd86f98eec6a759f9d3a47e541175912f7dd81e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e685f0454d179c229548872dd803b04d6007ae1aacbe31b73dd2533b000463 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d4945fcdc7fc62addd08b5fecb0c720d206ff64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7933c6a36bdffa8af514088377e40a5154c8a3bb02b3985d1f96206f05a5da6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..757ec8578d7506badfb391fa72c0e317bf5b56ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6605c321d23561f288e3b4cf1a8eb20a51b0ac26b54fb1e6ab52cb023daf9961 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c80cbd88750caa9125f18c8f700c7b10344cdb1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4013fcee21ab1ba1ef9849216eb488076526a397e4a6497ede51d0006f2c0833 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf9d687961565b22c821330dd966d3caacfe4b1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68889309ff9f8a354511e63bf6bb1515063aee631f54c51d2776dd23779bae2d +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6750cb21974f30dff17a0e014d5e702ff5d9149a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d49820c650a79fcf250bb96ff16d1951b9391abaee3b17953e6b0f7032ecc0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..585b2ded5d211a5e65537d5578c4dcd771a73176 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:353a738082eb1054170e2da9af025bbcab599de68ee30af3b9bfb298759f1b65 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..429a6af6e7b800ecfb713a607452ea2e87ef7618 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcfc43d43dac9381bf9a3afd02dcf229bd5cc7740058fd5eb8b6c81b3707d562 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c7ed949e525ecaf1e16741e04aa291c07d18b46 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba7b7ceb4c2c289e0ead7a73e9f3afb88d34cc81c3abf0129ce048e38905e629 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd9b676908b00c35d0e65b74125573440937dd09 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a56bec60a4431999de4ab4b7cfed64c759c14317d49ca4aa34eb65882550ad3c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a494dff93a51baad67e80ce9f356035ca4a7864f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a772eeff286b86b778f201fb71632c151fd99494d5a5f85d1d875c95326068a0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fc4d9f8b4220e02a9e785e64e2be728b46a236a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:198aeae85cb199390124eee1e66928e1deb876a35509f5154f7493ee19299baf +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58ada993286a68a1d8be55bd6c5e1ebf19e8f39c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95a75fcad6d614fdb0a26ba9de5badc0aba539c0c5c19eb849daf291106fb579 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..627ea1d41f7da965eda8e92eac9d8dec59fcc742 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d59ae159eab02b8ca5ead70fb54db9ba411cac21cecf3f17b9bf1ee3b8f0af22 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26011b6fa21a695fd1d2f2b4e9eda0f54e649ab8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e4a788de6efc9dc4e6eedcc213fe0129e801382d87f1353e38fe9be6483ece6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da5f51e12ba8feaa5b9e90b56e08b4ea5d726b9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d2a30327a2fa10383cf5e7984e124194d92d6e2a5b80870b1bb5d9325d73e61 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dcb81044968bba375c3db3e5870e9162fa4a3cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d478d2da69fcaa3819f92e903d178c1ea5a39b7f83de7558d81c9fed1dd1096 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eaae04d11b41e1db1f4417c88c72a8cca9437c2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b24426f9b94f68d7522c9ec6d78cf5eff6448ca203ff0cb8b26cc94183bbb748 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a876f4fb1fffd929c627d65f765f5f96e9787c5e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb432e2689707c5efaaeeff49fd8a43fa7279e10a76cfc571ca46433b2683182 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8154ccc2bd0e3f23cb50a1b5ee5c8456eb474a41 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da2325b50a181147c380e878adcc31ba8eb4a4c4724dd7dece2397f963bac3f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06b0173fe74ef823e36b3e396e52c35532c427dd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c616be24b554b209f1b67a49e64963311514a698a5ebaafd0803fa13cbf08bc3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7e0a892ca2a80c57ab3060206f12793e0c2176d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a52f1d9d2e035c2b390e8a3d1597525a997b4d8caa5dfc9b3b5481f33dded8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d25521570f7122cb67f7b6b153e6ce1ee13ec0b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:483d27816981c0254e7e5ea85f286c28e095dfa13ddae4a79774c33644e46c42 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0032252d99964ed92d8caadab02fbe420cd306ac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af076ba90e62f236d805ad3f01c91e5dcc64d03653313e8a0a1f3c73ef4ba50 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78ac9041f20a2c266f9c37486369ce466de8e592 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d569a3834db89982c3e86fcbe4f7dee2b89c94e5472c199f082ece44bd1e1875 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ca5a12116d8e214ee3fab7a9ce8c20009b4e4a8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e50638562060f57625a2b266c940e6c4c014084821f5fae280f1fa7600278867 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e887b143370c4c0a1585eb479acf4b8366fb3cd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92cd14348fe561e11c43841b9cd99b9cccd5276fc93299c3e62585cce0df4d36 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f03b355bb32b689d73091e33d5567c16b0dceb8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:806324a64db57e953966e9260739508713b91df2354defb45878d8978767cd02 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6804dd2bea9b46fe9f46385f688c3f16b65ae064 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92a96dfefb86e747458d4c2b82e3ae54c11c4824ad570c5fbcad4ba69cb41c88 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a84085d4046ec4609bfe16aba68eaaecfddc844b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d5474a574dc6cf31cb9954f520fdaa84be1c8f31ac07a4aed741593e7344063 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31411c26ef02c7ea6c12c9741e36f89a8eafd597 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16326313a181204da7e72b665f9fe162d95ed5b83d2da2061ad38d6b992b4aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec037a7f5b45446f0209f9fe1f14e29bb39b2b5c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77411e662aaea2b1cbfae2f6eb1d496f01623a0422c7fa4258be61e803a064f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23d8fd6e22a2d31912c2904bc774c46277f394d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bad0ca479afe49932b2fd3ba8f0521c3939473cdd77b1b9bc92c71e1567eb1e4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f4db91fe14231827c97cc8fb87c1a1e26b9fab4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:231b20bb58116b6cce5837a6a37146f625d3d0d4ecd1dc221081d328da50d078 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac0ce0ecea0cd2dc579454dcde6153952f1a17f8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdeb7d64eff2e9fc4b5f5603206b64db7edaa35b3728376a9753d9b0aa919ac4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d0f59d4c3c6b76b4e16b012139893c38d9486cb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aafe944e364495c00d851e79a4d5ffc4c700bf4638aae96312cb4ba6528f224e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8db22f272da111a6e84cf6c15ea6567342569231 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4507a2df84664e278ebb90ab09eb059335bdc999efd20329edf8cc07e4fd171 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce659747b6c176cc69f6a3353abd9d7ddde0b002 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da1e388bf85318d464bd2ee726c646d08f994c83c9ef3f6f5be3d0c76f0e6fb3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5398b7dd481bb88af52ab203b816e06e6041a131 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b64cca3e085eb0e30652cc61939718522b26328fe6056c42a716354ff50f3ca9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c534fa42dc791b460add3e08cfb3160e5ef8a7c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff1a73f39b2d6148105368e215f67a79af8f64144406a32819cf316b7f11d4a1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3153014d4ab981c6f0338167ef933ea53ecc53af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe4b4917e5216aea9fa62de78fd9548d34526e07d8dd7c6adac957ca1556639d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cc118fad16d52a7d5c4c0dc106812ef4eef1675 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef21857b5676f5c7545529f1605639f2fb8eb6be6997d03efa11d0d393c5566f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4216b51e413d82bcc8a0c3cb64300a95ea4e83c3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e74345acdb75aaaf646dbaab1bddb9b4c3327baeb132392cc1ee6112f6288ab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d0b221e6a6e8f14e2212cfbc0af0cd89588e11b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d99233d2f237182a02cad2ebe48443c2dc7172f5722526e2739850f3d1b77f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e92314d3977caf5d26e2f418ef2ce878fc7cd344 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0510be3172dd43d6474e3eb1ced9e5dd678c89387f29d3f548aa54c1a870b70d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ff126292b925093274c43ddd18658667ac56670 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14eccedd07da1be64ca8dcdc8458abc4875f64287e66f886252bb803afd3f8c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4ccc7723f1f8e769fb0962ec4cacdde9b70f4fb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb23b6d433381fae85825f1b9ed6dd93ad475d31dfb2ee61d2871d4f38e5507f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ba1d806fa748bb7925d28b22e8df3ff7ea42ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5f52a016a09055182877a6902cd16d1f578e70144f854fea53b3e6a02cc1557 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdf2a2e112fe899d9a39968bda749d0c2d50e60a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c6bd886e1884bbb2f89ae1508f1bad54bc37c18353f4ffd095312f0b7ccb99e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56ea1c773d3f63eee1634412817d76b5b6d40a5f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e26fa21107cf2da8446be19d1a70160441a32e32d8e894d232c4a81b5e8bf69 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..590740ffdb7e731e5fe752c4d9004ce43237d472 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cab662d126e1569d5078b3e40db2ff4b3070fc2e48fefa22309b938acdf0626 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6aef82100f23c2c5f3eff79cab5d420b94d7e37 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f6e34687163a8dc7b4bd8d0827749f391235fc8a7d86db8575ed7de95947810 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47566cb327bfb2156acee2df1de66ef275a09193 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8cc791a11dd5e09fbc70b4b1bd86d3e5aa940b42d46062c0862dbe8e77cd334 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3c9124962fa31e3de640ecaaf22e0cce06a75ee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:639bdfc2d7d50f7bb066f024d4430ad8158a8df9d2a5959cb6536fea02d06237 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25eafa4d8669c4409534baaa49ee1372b86a36f5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7d1087bb4ae9ff9ee33b2e6d4496378196f0dd4e6a351bbfcb8e419f8d0d4d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39c04fde7e2a98aa32414ad3179000cad4a4dabe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:644221c34ca9249aa5973ab6592c62ab0a7e12d0b93633aaed544300d75475f9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ecbc222c3ca556e32f706c77a84ec85f8b60594 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9476a7577b3d55dc14948bd5f22b0d081a9e93eb97734afba9b687e2c3f3b586 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73e1e9d7717189c1ca7e66082a604d715342ba03 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a80fa2f5847cd1ffd3165fc3016bb987b29d25ab94ab4bde7f14993d6c57d053 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45cb2e4e9a7759edb8351df7012c96fcc6951a5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e705043bd2f4d7b001e4a47676f38aba533d9e11b4fafda5c9b3864db72aefd0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fda27bc70d722af0f3ac92703a2f5d7182ff241 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2a0f7a6d416d7fedafbd60a6768a3c6e8b3d5fc81278b54791558dfe2c56b05 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6085267ba35a6a29c3edc55c1a77733de3a74c6f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6c0314f2dfab3a34b159a6363195332cd541e5745e42e2005e3c147fd18ddb5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed7da2eb24c5532f502a6be2f8834c2d48ed944d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f5a893f5aba177c1d535cd7d385a27c3a4d3f44b63846e6bb7bd520803af8c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55dad9d2d9716fdced2c5257a9e59a2cc2f93dc0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:785a77970b13ca60b62d5f808e5e61e32f7c6a6915b1cf705276074dc2b1a6d8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7eb5d2e46c6bc14065c9525d269dc8b62b14123 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9b1e5ad16e9e4ed3718b001688510f3dba3ef117a3131e1d5839f8b27d5b5a3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8dcd9dfc7ef5d65a13dafd364227b4d0b2502f7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e90d573b965eb3a1d6a67297499ab39016afff01a0ccdc1f44bbbeb680543c6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06c4e8224c8439e00f3d6541102fb203313ff6aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0fd212b7611e26dfb8d9d87e427fbaabbb380a9613c54e50e386b8a1ffcc374 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0bb96a60fdbae9bb98b68ae8583e73010698190 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3d98e1f6b842d09d83bc489a3476fb29cd0b35fd17b24a4bc412a6c5c57f139 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a51b94e77fd30f972d403a4063782dca59b93f2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e4bd3eccbd2c215f5477c8d609eccb586fa921e3904b26534eaa150e61f88b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c784548dc00dc33d1f215e43ab97eb9c05050ce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:722cffdb060c4eaa663b780d9337fef258cc78c3b65d35e7161d5de70a519e33 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dafd03d06afad30d4636392879624a31b62da7f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32afa9873513ae964cdddb769cdb20d6999781f5a55cc2b403888aa09b3ce8d5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbc92e7afff652ce864a3c654b20c4521d02f516 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d42508ab62d3cc743a410fee64a74a80087c4b419fb93f6a0d3be5f84f549577 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fcba825fb62121a192da09dadbbd3452a634dfb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef0330534a8bab85d8e2d7f9a4b5235f0879ea363cbcd4a619ac3cdc366cd39 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7d5513fa4a11f57190c44092b678c5bcbb35247 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa20caf7cbd7df241d253747db03c8c8d66d9fc3c4edf58d6a804cede18b80d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..185b1d33e8a450ff54fac4685b609d286f5160a4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb62086c329537a7fc568f5a0e302125df6d892aaf49e4468dc6a8dc04f76338 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a877a1052dc748e316bdf1c82a8e4095333508dd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49faccee128d2a32492a2798ec76ce68c960fe058353af774a27760901ccd8e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e015e42de7aed8bdd1b95ae7fcf944496b733d5b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32ba59069f31b5e18c5839f0cf9a57ada27173370d4ed09227ef22f8ffa6252e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ac7fa1343eaecf9b3c543f60a2601476f02bb95 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a647ec0fabf9b22c425dbb8b0d3d80b5b6ff220f024270fd41383d6367ce1c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38a91d534145eea7c924c520a1662c1683cd349b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56240cddf85dffb0a061a3f473707265ccc59af7d76f964426a6a2c853cf6b64 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54ba698fdde2aaaa6064443b8e860e2ea76b6312 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c22df5dd557cd875d34457b4d35418c4260a7c0cb29ce828cfcace269c82adfe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..777baac69de00a16526564679c6ce69125b5de4c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d7feaaa716ba2c7a65a2a0a029536d071a078b908e126013d03154f9daae66 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36fb29853761eb479ae91b97e645d8e7c3bad556 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9837d31464b233460bf3f6438429bab769bd3d726721578d21e2579172f33f4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a75cefbcc70ff61535b6cb9e9a8429e2b06584c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa2050bec7e6132783b984d671f680fe6bb7d9c6ed7764c5645fba75d1dbaaa8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e673a7cc38e95036762837ea4901d675e10540fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8450b1e21c90f1d68149cf4e0eb31dce4cb8c30bb9c2dbb9a21d2cc01f2410ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..651f503f45ac17b795ec9721d9b505303cfe9862 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c96b7b4ce8d4c1b61f8a3cb0b79b6e03dacf6015c5cfe4ca79888cbaa4fb11e4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d228fd5f6b6d33af94a65115b055a8cb374f5ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1434cd4706d2e237370e421e4ac56f1643e0b23dffee85addd07b47b894596b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0582d2431b814f70d927dfbe5e4e189b22ab5fbc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22c1a6a19659864131c7f812612e8c4ae041d75a9d9ba2cdcca9a39ab342c562 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f4c2f42630de2542612d3c75dca7cffde0e7007 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff10f68bbf6fbe84619844df448f49df918d1ef6c666bf0e0ce57910c8ee9a1b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0ffc951a3176e885dae4a85ba78e8b27ab3c745 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a904b48e65916efeb7e1223cdbcadb7788994fef5f643643117d9de3fbfd0bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46740c39b0325c36d3a6a4309bf98423b8afa57a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f04a3d7306cb955d80dca6a40676297985f3af1c2bff4a0f2122c6d181be691 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..815e9bc1b6ba9b53e86e63256cf506c8b17ea67f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6704ca97c0934d741f8caad822a00d1fb96e4b026462221003b1ab2e74142a33 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..370aff7c68d998aaf56211007049ed4860b70eb2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c023505a1acf721d5dc49d59894e2bb9203551e0c2ed8657764708533df1895d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14da54bac6a211929f505faa09ef8a8635b7b2c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fab5b9787138862cccc00a1758ab38e76abb74a5b093b65e9741b4edaf290754 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2eb9d9bb92fc8f071d271e40d17a451f780cb11 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d40612cdbc4d2d0c975c9b69869334dd535c97fdbb07df50990693def5a2c4b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4667eda5ec01c6f480dba57c29581389850909d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9245cb8ce4d7785717317a504254f8967af98d54801606580fd69bc5a75b6aaf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb61b3b97a05d2400480f40ddfddfaa3c2396b35 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d69d3d61b0991f689715a11697602c5d524b9f7b20c106856ede9db112ed5f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79f096d631d0c9dbdfbeea522378b29bdc5bac0a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7419033259fb8c06fef8e5e60bfd1ac3298f5a82abb20547f5ce1a90fdc03d12 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53e1603470ceb6e4b29b66dbfebde57e3f6bfde6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e43b3caa60bef17ec5432417cc104f479cdc8e1843ff2ea609243593fcba7bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23c3c40e6a81e599a511ee6264d2897acf439a2f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a3daa2791153748fa37448606310afe2f303d54439dbe795597caae031a4aa9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e6c69ac2965feb12f1403a88f9b3d0a5cccb33a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a87531cc11c7a3fceb608c1cb065b893513c5dfe6dba557a30c003fe054d7bdc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bb94a8ab8b543fa2c2ee7feb6a79e9739ab7457 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daff6eb789623399fac4cdf55b94cfc5e7361c155fb7cdb0d8907e3a92ef890f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb7d11019a04f0d548cc3c8a34b9ed70c8638279 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b191fc9b0e62f3b9b20e670cd21cb5b92971e8f07085459e22fbd368adf5f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba2620f8b421dc4a7bfa95b59d9c7e093534586e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2125858005d79a00ad333455877e72475edcf76ccdc05b5d844434c900a957a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96d174ced5d1aa4f8d350b6d2f501491f6331356 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f3496754cc2a96459d18190e14c1bcf1bbea707535542a05b5ae6073082c5b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..817ac2a00dc23db18c955fe37651e51791ca6461 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:698d6627fa6f5726b9aaea0041309fb67b2f1088dd395d0ef8e4a672375626c8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1bd392bf90b93aac784fa580f51090d57358a2f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f372dacf7c884c19027f80688dffe2eba7cdebc3dc186144680ec1ba26e3b108 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44ec911685d54e7371570e9c350a7a83606e7f5d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40a98184b1a124175cf317e7edcbfe5d6fb00eec1284b0549219a4429d049cdf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38bd4b78562e2dc976e109001af1aefa80242cf3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b283982fbc31f1f87e0bbe1654fe8e48032faeb174ac0459cbbd186d1749315 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d81aa5ca9e62c2900e4e09ba09c5251629e8a07f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:702b26ad71f686e26ee4514b1bd52bff5670dd8e510d7cbbe57471dc79eac6d5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d7a2484514282bf6f2cc9229349ffc3960b0714 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ad064753cce81ae2be57bf0424c7804b40375cce1f05cedbfef56527848f294 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1c69c0865196525d25ae4f06eb37bf27e8f7a74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:573c3422ecac2161956e77fc8ef0c155091e2da30cab3c45a9829a1dae4ee06a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f6bfe4dacc7d25195906d54cba01558da92e33c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a0055a303efc1a87f030c7983fed679991e52f9e626b5954af06012c3f71f4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23a6ee3a426c506f4b24dc0734fda06bfdc44f7c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce1f131ae5706ce6d2dc57ca43785e46b929134026b331af0f5cd855a806660 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdf1a5599c980fb2e6b7b26165e534913c20e924 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f722c8710fe03a50ecf29fa05d59bf3e12632141e2f63bde06b781eabdcf2d7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7efa6321cea76acd9c8addc6a110e1fc044ba211 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e605d13c70523ef751f716ac17211e58a518a282fc1868801732dfcf0ae09da +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad9f19060f6c61fa1de8043f3aaa53284d464a78 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a4a5cf8538f7899ff5889ef2476ab649c85863e3c80a7bc8c3ca824f99cc98c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af6e4a221a771e32539042400fd13b925a6e19eb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0064cf23058d2928c455fea09d2b424011677ff810e633eb3c325066e1ffbdf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e42e19fecfcefe9a8183163e8a8334cf7e8c623a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c34f803db311e971d3c7f81be307c99c834b95f00ee84afc57d9c8a1d320d04 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc175587df2d6bb5a7cc1485451f47a34767ac6b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:987145360dc88b6cf53ee6f204adface0fd5fb7b72283bace5a8eeb11b1e164b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25e346aac4c768968804bfe7bf0243d0faacaa4e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76ad26c1ecd9a85ad408f9ce634f8d83afdab8c4fcf804e4f3c154f477c98104 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fef49bf7e3c8b8505ef576313ce781c181b4cc44 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3468a06e2d64df5597d461392d7b54ea5045ad6e16497623adee34aaac30c3a0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84db1ecc55d379214f89708656984a0fa1675976 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6ead18c80121405470d31e48d4e7c87d969552a9c7bff0c6804c1bdb9672fda +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72df005374fd5fc5abd9ded933c5e685d58c3dab --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7543e1a64320bb5a3bda8b22f9d7d8bc75f07752318bc7b11ea432e7bd1a881 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1794bc81a434f2949f0d1634acf01df12133dce4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d47980bc51e7099b50ec5b7ea3ac7780519c94e84eae35d4e7c8a9eae612183 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9da3b62ce18a85438d87cd42174644c8df0cb24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5306d6a6234775c90e271f0ee5c41ba86ba68d21284152b92e62e75a648d4986 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7103ef9b4c0e89c3af5d38f873a8c6d9f124cb4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8bfd6245a4ae914b630e66173ed41a39a4183c75fe9e81590058aa0b3217e93 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a2e333a13edbbd67f1045cba4c0644cd65fc101 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f17736bf0493c88f6344b6ef3449bcf8cf244b253f6198af67b8a24c67563f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a33437bf7369806e4a6c6ea0f08c8e76133fb9d3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d687f29951f199e0187f6c41c910505fd08f63e59f4dd822eb75116930751bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7f2672f269e3ed343fd9da5bea16a8556c195f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82a766915527056bac9fb19f177146bd8770b9f98473ed7514cd6b89232618ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c5878b77800aaaca0b6ecabbd97f3f92ba19990 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21f57f0f7cb5b066b2feba7a8090dd7ce8ff35e2110576cae7811baad005687 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aa0a3930a87ab4eb5a6468707d529996f231001 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e03b244f7264a263e83d047ff0dd64a62d618492f34a30cb6d6f3eb725247158 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f0a2bf59bc1d7e8c607926463581c0e5bae85d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f6f5eb0d92c5b02c96e11af35379194688ccb6dbfa22f486f41544eac125b43 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04a32cb7b7c1c5b5fa939b1bdd9b439ae2233904 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c53f6dd06d083c5a41985d04b975e3803f42af2a6feeb74f27d47792d546b68 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54c419dbfe86d2ada4c0ee67766dd660aede2931 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7108a87b08ddce6b18ef8cef69db9b92ba30a3f89177cf3f1604069734cc8a6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa68a9bc9e4a00ed053710626e0e72e33d2f1d36 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584e66ff111ead97242df09caa00636f5e38db7b1b3ff73f356b9c49942b1ad4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0b394d0eacd06b2fd79ecff302adff0804e8e0b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:165b1c80845b0923b40a1941fef4fcda7406dadb3757b3f15ebe2d2935300626 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a930678ed21dbef9768dabaf787f4ce2baad642 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4d24726fe7be9b47e1a63c89a860232558d936aa521f0c51cea8c7773199715 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f0517340681005a84c8963be5dc6d571978ec61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b15284f973a2b029bb3adbcd89a6f2e9da97e2349dc9711f28cf40fd61578f7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..871a2bbef988ef1410927c029aa506356f2a54c5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c524e809637d893db901f836e38f65258a38512f9153d3b93ffda9a7fc5bc03b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcec9daddb83d1636639d83aa5a172474cda52e1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:589f9700ac7f2a7fd14de7493ad20da6011ab1b6cee25bf19ca3f74254794cd2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8447f2d056ba246318abeb0e4c877f2154e73cd7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee5dc893f50ed7385d04bbd54376642b6b6b559c78de02fdba025bd46eb7312f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b0b05a9f8ac6c4ebeac07a576a0e6d1924e301 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3c63d8b42cc2c9dc345f6e7157240f0d8cf8808fb6e7ec802c643f3bf968bb6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96c37a015604f6ebd010db8ccc6c82d692ab4288 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc807e100877ff3a05b7769cfe8111bde4df3d7fbcd762254a27824e1d13e8fa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f6fe59fd52934adfa53be958d52f2f9bebb3943 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84aaed0c48a9b5ce5f2ba550913f537be60ebff769afded956d3ff94040111e9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f02288f2c03babaa41d067037db37bec2a7c8c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a30cc42563336ad9fe0ff40c1cce894fa40fb8851d23238441eab2bf277cf5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fdf936ed7d089f800cea47e42a7c589142aef71 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fc4892e1ed4c77be9df8c5191080b508fa61986b77de47cb4379952ffea9575 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74eb6d6b646a7c073406bf7ce108ad47e414f52a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3108517dee8a5747ab4a5d67e38544acd53a7e560b18b15c74117b0b9ec6957d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c159a92921d7ce889284b7967cc90e0a3e1441e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4907da3cb4fc8d06f0d2b931cdef700c2377471406eb473c7395422a2ecdba81 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb8e9507d700179d108012dda1e9fb5b90b14539 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b833bec750a2089cf68c71dcf1331ebc11ea554e3d3d02a074a22b7503d571b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e17399ef6494402be561f834059dccadac840650 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88992a49fe24748567023e8432f50cafef84f55a787784206cb683e0a697dd6f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca42f78174b1e0af2c0bf6128e8b2c356cff2a7a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26f9f26420c49fcdf4c72734be48df342c6c2ebb422bd86860901fe3f1e6b638 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d8ae706d9251d0e95a57490a449147b22d3a158 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4f725cc29915a451f1ce5fa0762f52e8650b21fe0d1160d16dad6b367452b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb7cc090eb2a475d8ca33e7a23bb8f67b18c72e1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59742de08148c14bdbe7edbb9d25234387129500d48d446cf2167359f9213175 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a4af11ead90c39d43f0a824c34e64650954726f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac183da0722b9e88877ce7b07179c1f52a6b629e90a790780087f2a6a62f7e6a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f28cb521fd8e4c80fd02c1a6550199eaa0cc6a38 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44f60cf8e93512c9f227771a0bf5c3066e764416b8ab84246a5937ddebf1e67b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b51949ceb687276c7bc2391f47208d9f99fc85 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6302419487ae23be5b2168e0039a56eeab1b00f959529749779f58556a88ab37 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddc16cf918b47b31448f675b5ff7faa585d7db9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1acc1f94f118c4da105098c6ba85e7bd7d1b2ebe30f717f2767ec5e51d5f8be0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..775c0d7487c6ddcdeff4f4bd4bfa51321cdf76f5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d2d0d7b0aee2d3bb3d94f97f194841dc7c865be8f718bd6875b3b745307b25 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4e38d0aa137419e6de5aa8ad4ae36b08b4c6cfc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41a4a0c4e33f57438ddd7e76283aafc9077942d52f0cb8bc3cda14ffc4405846 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50bb942c3a1902267b065c1b491afea642740d87 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8aaea170fb7ff5bcafd95bbfc552c9e239a6b9b3d4953aca7468f9a65a890 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb87eb70e1f1484478647427df238f138f03d34d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a4cb5246b5e7b95c0a91834f10d2ebe49542d0d80f2f3db424a7f9290f311c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aca5f99d723f223b9875999b4de80fb69fdf5ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b039b73275e83a664239da53d563183eb56efb0a78921ef7abd2c32173e1a5d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e2bd6fc3250596615d53c62f4e39bed232b9346 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b305c9302933791178bf08ba7b9614a1d8abfb1353af6182927640b7d2ed90c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f339650c1113b75bb7caff31795d21786fbdac2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:030f3f925dbeddf077e37ebb30b91338ac38afb3a318694ad6c95afcf749694f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81079442cf4cb35e1d240dbdaf889a5975af69f6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8b948d5ed514f60d717b3ef38a1ef0cb76566d0fdff0aed2aefa8d3f04188f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66ada7d575e55675ac4884748cc5c0c72c56e336 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc7b5d90a03eacbc31658a0f4c2ee7dc6d6d8a3fffca5a28305812daaf042a9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..caa75293aeba84cd451f3d8e8bb9eb7d00a22fd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f56f3fb0fae4ff6891ffa1c539012319e7c116daaa9daa29858d1a24d65e94 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2651ae5e2e3b747bfcf088c4c37dffb241ece3d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a67ecae268011e683e6c80c507c9903be430463b99e676f6cf9bfcbd9b2b13f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d190f808e037402b4843b918fdf5f6f82f1559c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aab174b888e4fbad41515876c89b741fbe3707daaa04a5e4885b8f5ff14ea340 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90c97726866095d4680be13acb963224dd76bf3d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1845a962509768a8b79de39031e57ac58a5db795b6be41e4bf51f2305df77b7f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08043b5b6854bba905fe95a7a9cf304fad838ca2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:980286040a7772c398857a288c79ed5e6488300f9c8894a7a57ea8dadfe85a97 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07664ada4ce15f951b1f6a8bbdd6200e746ea416 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6866edfa16410023e7f9542732e2edbc1fe0c390c3f3a4a6be89cdea0c76625a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8b6608fbdb9f5c9f8cebabd4bfbb6802dd2c62a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e43ec2ef8a747064845515c6abd0dc8698be0ea503fab1b6238934cb311b795 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9cef60dc7e3393682484549e16a5d495958cf6b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f580fa25a797cf46e763e913ea2938fe357ee8686b8aafbce24d6f69fed13810 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f4417b9a4d55c6f41ce70579ed50245db10e6fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c935b7a7bea37301ec0b7f007c9b6d44ff76cdc57e196bac1efb5ac6e1615df8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..151bddbed7df2561fb9c17b69dff7585852394c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33e992cf37fb03e1642031738edc72c60b2fb6741bdd98353e0456834a30858a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c35c1d4ff6d684e897942edc15ca11733e4634f2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb64d25cbbdc75cf131368deaa683362f080733381a5d9037116e6455774f698 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76be9112150443643d69d5af71c157cc19e79d74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b064072d1deb77c67e3e9ef3aaf10d0942d104d95fd6d8fa8174f529dec3b789 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8201c0a00c4daa7636e801c4c94af22d7df8a04 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d6570dc490b48fd6ef03bf80b40b4d3cdf2abde78a7edbaf6967172fa7fe824 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39150cc37ed1e3f0f1ad95568c524d4aea6200e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c49e0c41a43164e24f52a005837bbdc60d80795b1e7c5d9996d2c5e51caabd5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..157accdd472505f7bde8c3c5b2dd4f9f1f2e05ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5e6ecae8baa437ddf6d395509adceeeb30b42878cd42db6661b8e7170459772 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1a4836beef67dc8de21b330d389fa25ff476bd3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf244c78085773a91dfd2f7f0c4daadf7357f67a5db7108528bd57703536eac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..382153fb98ded6b340f4d2d536cda66f0049aeed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7fd529861545147e57e561d3456cf6537506cd238af642c3657dd971b19732 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f50ca3ae889683d11966cbb9afa07ac929a27d35 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d28f0f539f7a89bcb08f3fb1c4158294afdfddd1d9a6bf5c91e780dc0ac7bb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..548f8b9b43f7f8c7a07a7f372f2b358d43a8d2c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac7e592ae00dccb85a14d35ae9392bd7b1f0a3c34c40b3b1efc9e0d61c84521 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e933af67278c9c902626696f11c943a1e0b2d8db --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292f48edf2c6f01ac4b2202f16da462db7e66a4b57ce3c61db3c3e4fe3cf03a6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13b107594d102631b737991027ff1143569a63b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbc5d070a27ce2dc3a919ea7ac87e3aa18783a702d5bf686fd928674919af057 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..585d61e7e705dd71d81fb6c793cfc19292238952 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2958917158fa8e549b3878f3f020ad4bed4169adeddcd571a3700a4c991259a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d2374280abc617c8879fc4cfbff9b93c021beac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df12f71331fdd4a8b73ea9d55ec51f5aba2cff6fc5b293359c944480394e3581 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8af3b376c91506fe000ed13649b17c98e5142f5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6acd2effed6387049dc4691c555d6a35a049e5792fa43227f8086651b808c39a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f5ab4761109e38f63a771bb23897fcae85e1bc7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf91fac58f8cb0b315e1037fee47886ca54c2d51275496e9bcfc60501926475 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..414404fe2ed7e92890395728af4b66802a3e78e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7f28acf1ad1f0f95aead2271317c08d52edbaf33a77508963477d90519bd32 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..772fb98999814d9f371e749aec53f430ecb89f7a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dc17ec139cbb0b586c3250f3e36386c561045e01bf061df8dfb4a5be328d26a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51aee386c56014b938bc22d7a13287f6a2b8ee58 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7b87cb7500adaeeea88af50c09720baa2af79db7d23bf07162510ab7bd3478b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d054b79775876657536def8e269c92b4b02ff9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57633006add0d1ebc907774bd45111aa0416bf388df1edee9c32b10b0791467a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1ba8c7969ff24ef48a418ee02cc4ca8721f476c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:528e6e71009475255e9bd0931f749953985190279062fcb4ac37d117bc2b29bb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59c86a4228d42b40027697adbcf8f79cac51c9b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb9ab4d663e600488723602398cf92f90fef5bfb8a7fbc4b88ba79bc1bddff8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a8fd59197214716649a67e350c277d8d0efcff9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_18/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c145a9158d41b743f96e301d0eb18db8ee8f1ec65794ba21c2acde39884209fc +size 11395