diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca99896168e55d12f1239bb87f24e63f41de52e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10ee53abb27a2ece42f027fcbe86fac973f86a0212225dc0fbadb18b7caabb82 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a2b51b6bf852cb9288293fad0798ccb574b401c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9acebd16d2e1a455d56883d03d0580245d76cb7945f0af48c2b6781173e447 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60eb2d211575c7ff212a3a87812c6e0d7d28458c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba73af99613bf3b6b5279688869dcf1a36ffdf04b486d8e8f279884043fad140 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..788c71668d7e5cb66e98741502632c68150cedee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da8526f7b4237684b523a6da5f731c6ba7984f6e1227ec6e4bb3c1fbffd050aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..275ecd32b6b19784c7591aae0079dc58b4937694 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df1231b4d1eb09c7d5893940bc34e7878591ca8aa6e358b63e4e85ba02b525e6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf9772c50132330887a94d18264cc8efa56a8157 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9baa93e2598360d51d4f61907c03fcca86f92675feef43fcadb6847e5592b36c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3b79aea9af1e6f5ef11ebe0d0625c5854bd7164 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc0b5205ae9ab01c599b93a63bec73ce61a8884df01f566259c9dfa7cb82c48f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3086b97cf5e6d9b9b82e6785289f149996aaa9d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42fda4c880b477014b1c320920da812818e2f7f6a9effccbe30f7b928bed59ba +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46f2bbf7ca7657ae04ac0c89e48de07b69a1516d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24871f8b42ac7f5ae74aa8879066cf0ffcc52c1dc3de051e94e9d46f1e6fe5b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..588ff5ed5fdbb488a811f7325d05e310c19b60ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebba9812b20e36dea3895d2bca4268ab423f671e70873e0063e19d5b2e0a1fe6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9460c8307710a43b537780c9d257fc84876da06f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cabcc04ae325744f5aef58db94913fb0d1cc4374acd19dfc2f610848cbbc37fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fd6e485a78139e68676f84306ac76d7bee1d28d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e439de20722865e3c4f7b26818a293486b70f1ff0ad6d6a055ee84237ba06508 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59eb0b594a1f97cd3d8f814e8236ad6cffc3891d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad5af192dcdb31bf53b9e690b0a2686921be93fe4bcbaad5abe8619db0c9e338 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ee97e1e4171caacc9e8f13486ca52bf39130442 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0efb4607fc3b423285fc0ce6df4f274847126860e24d12dab8babc76353976f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb5e78cf6cbd1dfc351e3aaadd3c75be5ab2d7bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b056bc316d24b6dfbda28bc6e0f58962a6a71a77c85bf3676c313657bae1c3e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10c35610153bf4a49901e5ded18f2c8f02c10479 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edf69ca6b8d52e7e1765f50a18c9e86e58c86b891489510dd9531441efecde0e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04f715d04cf9d600282a94da8afe6505080cd125 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed80ad01dd16b6992c8597143770a7fe8ad8cf575e5a1528db38b1f139b911d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a236a6cca0703aa5203a8ca6b65976adaa57532 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:040ee7ba864c9fd18a3d82d0975cb588b6927a88990bef069e31528df6b2b478 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..401580facfdb281023c4ab6951c7f802d75d44ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:934c60016fb070c7b3bb8ad9aa46481679f79cd714bc065cfce2fb9cb705a78e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6017a9eb6d3c0e465d80e298924475fc168e011a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:840719bdd2f1042d6cfed57e500e4d3e6e47c9dfb2547562c730f0ed3e4b125c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd50e09bd9c57ea4a31a8fa7cadededa6eb08d77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f9a00d35309374520fd054179c3bceb52f6960539fcb3c10b681caebe00a89d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc57ef65a27f3178105659f5b0599ae69d7a9079 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:082e28085935d38a82d47edd923af3843551d3f3c7fb4662c7b1016a4a491e72 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82d09df48f9295fea721059351f995b629e3695e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e3e5b37eb2b5eec1939c691a00cfea5ffd7d2f30f94d6b53b63576b3f9c3c6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1d3b4bb94ed1138bcaccc2bf5587c502781ba84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:943f814df676dd4925ceb881694201580f45be9572de47843d0313ed8d75c911 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9410a1d15fd47f67d6e0c8b9abeb91fa181543d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f94049423ef07aac3f9c7a1cdb50a07e369c5859ce7d62ff5d662e5ba1619da +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b674d2c5381334034969e818e4ec946180f8947f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6df3aabd5c3ae2dbfb9a69919e1af4906cf0a10729759714029bc629ed1b193e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ace66edef59ddddb1eeb8a9f403986ffab1bb5a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0e4dd8638bd60194ee1a65837f794128cfa9908226e660be7acf3cf7339e924 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edeeb1920f0dd23ae0c63c8d9d439c44dcf80f5e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9243972ff6b4c3c1471d42808561dcbd7db0fc309bc40e99c040ed08f3603c89 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3fc2ad76940d9b1db42309c11b6d9526c39647e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c58ca5a1ee1d1a91ff1529cb361be0e631d7f4ac846457cc866a882a49efc6d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54a184c97f3c1d59f4176d068dd23824ec2bd6c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d62a89388cc9d3e7cf389e767cbe7cc11251d355a879f7bda0ca304b28e92a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91d69d6d220d0b4b101ba3189dbe216c1e3d71bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1914fe5e6c93749a4b3e56444b2f0ebd9cdb1d7a65a410e28905308b20ad0d8b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ba354f81bad29871212f4327aabb1a68644020a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:395c10b3b1d22c8110dbfdb519b9d74cfd6699307e54ccbdc239df2acba2f79b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22ccf0aad5a63272d5545197eec1827b95c395ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:437d369372febd494977808e201f097ed830283ca443d050bc5b64d7de6bd932 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..399fa75bcbd042f32d7fa925e76603479e7c94fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc752cc8a3c2b8efd56edf64f3f2e6adf68640311435834f16705412a0b4cf57 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91b5e1fda2fc9f11cb42edd5fe911ff456d884e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41a70a702b06795702afbb1dfea8ade164580e7f34c2e704635885da1d4a7baa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..061259c3bcba42685ed6b5039697af46d584826e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f54515dd2b819720050269e0245de81cbdb768139c7ddd59ae5e3e9c070072c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbc9450c506ee363b19af8c511f8d2a69fda1ee4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0692c1b605d743525a148ea80caa3d82b519973819ec7b780707489b0981309 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00039b3923c31b578c957484eea3b118938005fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca0c696fa62a73f2a0d14730f478a0630f0ddfce38f860b65bd70cbdb2e18b6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7de5427705f0ad785f8b9cff3c7e9b98d74251a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b9e786a15887ad900b78f48e6b41fd720f5a043b294cc5071a467b9346ee58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b7bc8a27d66811002a45be8d58e55a01d0cc3c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:643e511879d7474d56ebcfa0dd8a7fb1d07bd627ae565d42b89feaa35962c1e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bac5f2c5e29bb785984081f02591ac6cf5b9b04e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa12e858b2e4c7ab0ec6d079def65dc5c2b1958b84c94aa3929b7b4bb0839ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3e8fa64582aace9f08ef8f8d3bc411376341a0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66249e1325ad07ba71cb5e4e6397e4a20d30026ec94ad9774785e9a88ca73d4b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e189aedda869ac272d488f9bd74671d2c3bb61c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e6d58f4706b649685cd5e72a6b05a01301a7125595c68c18188538c3cba5f2d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb407e155fa7dcbcbd4e7757c17cee23c1e496cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25d9058515de04f31704bda04087fb970faad74f9b3ec06e9bf7ebe4c3ba74ef +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9413d79e97307b731b6f6b885109d6b20b5532ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25c54eea209d13eed916f1aba06df2617946e5e626b517f08fb280335ec05da3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe5fd8796e63507dcc7979fa45091c89c1e9d65 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abae7ae03881ff3d50de4d809fe029e0a3bf93fc2a94468ab62bf1cfb0a2772a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a96c5121453af1a751beca0f58c1cb74d8816dab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73cd7bef2620e46f37117b22827c4ab882bcfced244c0b23315a91aaf19eac82 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76be29410f47a0b2d1cd10ab96a41c0911dc184a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f15c2921ed66dad0cdda22a4919c382a30e3ad9d55f43ae29dab42cb262299ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ee2a795172e0dc524405bd51f58f8c393970c55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc093ccf318cef92311f7dec9457ab745b4c7d22d01f46843cfb902b49b83fbe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5d7ecc8dc95ad8ca49ead9ea58ecd346ce38c1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:758d4bcffb351bf36d689355b406fc3f68d2701bc4f7b23fd9701dc067b750c7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccea322328b7fe5c072043816d2a9b2d471d14fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13d9b81e8e225c5d8b0d6c1e4d5a23e8000c9b8db5be057d5cbe24c13feec2e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74253800963afa35954d70657b566d56412ce150 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d685cea21b5759ac46be92e4f9ac6e924d4725f5271f6ecfcc4aab338f7ced5d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfde0e8fc764b8dee09b9365c52ba6c71c9d8586 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd2f9076ecee04758dc8694c6988291752068a7de5fee0e3c611b602bd47147 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90b1d412f1d212c08528c4629c0ed628dfd500cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1d6a6573d48662645fe8085750cd0ce2c9ee55e14c6bad007e7fa91a0d80d7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e211844032e5ed9f6946ff775a538ecf9fa5358f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a9badd02e7b1bf4dfbf5f446b0d70c7a0d20b78cca2ec3f5ca1d04c00e1a6bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6656a4997d216800e582aa55c64e8195caa1d413 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e6457267476b399c4b191928b096580425508390617bd07d8d53f537248da62 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09dd74190290b764c0e6384e774120c62754da78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:548e35684152d6b46e837a4881236722dd04fcf4c7e48bed0393253766b06a2a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..426fd6c3f94c6355bc5900c7fa90de5c1daff770 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e54a50f44ef6d284d4f664f623da76ab7c575a5a4341820daec3b43700f7c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57f9d20c68e77c01351807f8ab6c401df0f7795a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:006c310d468cc30efbd27be92dce7f408b16e080583fab113f5189b12ec541b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f46c10a90daf582c4c02c624186f659f2bd1319 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0955de7ed0eba5833b8eeaa2e3e3c727e08c6581ce2452667a802ab28b861df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ba20f480d36008d2fc2981a160fb74a7f9a0798 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3d478d4b9c4b4afab0687a9371564c39fe712228e6e46d249267a2aec69511 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8097f342e6cc550e66453cf2acd589212ac3908b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7593004069919b1cff1d2727543c6df6e3106e5c0e0e5e90a128a09fcf6b8a92 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba1b99e243188428c7a0459b5153b87a5c2b2d76 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72144a5a7bbeb302151010f06093a511d62b30e4a76e70699b0d5a98c21f74a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5975c0c4120c85f397d51de7052374c50b5a8f3a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:930e5cf64ab5f62ca672e27497ebac391cf567d17e2f684e7fa9adc346ec31bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a402b393e310f4c083d192679892b7b45dc2239 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:499e524396ab773977c69d9307d8f353774bfb78e622cbb54d43ae7f9615c5d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c68bd8716fead026abdfdbdfa3cf47303fc8cf5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d57078e274d5c8c2ec396cabab858eec2a4cbc3b32044659f2e77cec887316d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17ad9846420db78c8a8ec9853c20dee4ca1dc3a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8f3cf283c43f1c4beea89621bcf2d636618445ea03e26de24b0514f43e76c33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d73edf144a39b0efabad828c177d2da985b84eb0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c53a53e203963467a6928c0f619bbe13e596596e915f49ef2311988bf2e81e7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bc502d20e5169d9045194b1e2628dab8adf1cc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8631cb53d87e7dfa43c27dbd6bfdd8c0d8fbfbc74bf1dce7b7cf87f26f719d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7939a598581be3e55b53e4a300b133dfa3d76edb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5477c1be28a88a647c73b3da7feb075174c1f18e1b0e2b9d0b36513dee536e1b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb9467d4a3977ff852b4ffc730e20b299d92d3db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:675a7fb98436928da2b7f83f4d4ee1270c46f222f102b233d1e07dc8b44be5eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e474b4b3361567d22e81fe3626054a96dbb3987 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbfc3d3ce5137e8c5acf603a664a65b1fda293715c6f3c1744797823fc5d4c56 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd777b18153a6a89e993975f2c071ba030024d5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a4c58fceb1fd2cf60ff65a52bd731fcd10ef4734698d14ae7d0018235fc6cdc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16d1b687dee6a40f502eb3a2c8047a05e5749982 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:598d2d0a14e4fc31b6ff5d18433d75fd172b96a1748f455c6176d82ec9e8bf7c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff8db9afe7fa1b0d32103d6b55345cecc87ca340 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab6d2b46875c5ace9a0fd25b3a9babc9a36d322e940b696359d8f19f3eae9ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..765cfe01eb98d3cb070c5078b5fd9031122b6443 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c06eeaf1a39368156125cd6f64cfb99be098f458de181d780413643634357c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bc1516f260d9bc3afed4f158cba1c9d2a706b2d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be1a7ca2ccc64e9cc95e5f2a0332d97caf75317f4d107fcb1537c3952a692000 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d71cdd07a49b92d090a2fcff27c65c3c94aedeb9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56e6b5efc2825aadefca4cfdbf5a13f1e6623d2727afab5d4a9db02dd4fee19 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c4e1d0e7b62e4b2e4a76ceeb5721535c5dae4db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d88b13015cc04f2d327f444c328fe3e613cbd35cb56f638629f66cf9ef91f355 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25ed040e7da6c8bda630b1267c97f7ede67c5986 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27815957af5cc55a4dd8307ab2540e90b7cbf3e2b836336179720e62e44352f3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3ad9cfcf4878612f7060f930eb4aa3be353f920 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea10e16ab63bc6f3d8f89f1645cfd44fb1f73500ced3315bf3bef29be9ec8cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf2e94361301e88dfacbe88227231997f152f280 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:078d6d282a5851b0a24f70f8cd4cebfb803c10db79bb7b22a8eaac24724cf638 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04aa44d902838f54a11eddc5663d6b70df216fa7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:341a2d9c42ec6336017182fcf908fc02d37058aa58c3f85713be9526d9b84d52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e01e51217a7abbdc2a6b5f3343e678cac879120f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81be5654ca4ddec2189efcfcf292713b4d6dfcf2f98f2d40b792d028a16bb605 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..354abb3e806a4f2a000c1ea372aab3b336cacf92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ccc0854d30a737d51aa308326261dec133eeff97a43eecd62265bf5de64070 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84da444a745f19006ee855ffceb72c34c4b70c70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63c51a72e7296cf00927edd506a2f55e35b8fdbd0615bd134a15a3a0b02dc25d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b863c4f2e1b6d3b42129e7c53a0c1cbec3147d10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c16f7ebe4e8fe889ec771477ab4d18b7e32535b297f3dc6109c19fe6119b63f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc586ba045f3af12695a08ee8f1b3d6344e0b3b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391d529df2ef6094cb3b699b67af33724f0d29c1d61a6fb00d93fb73a3d32abb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a36035be0362ca3033d427aaa48854bac8e2fc5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e610037b9b4cf4f7a65c82da40efad7e274e4b0ebc616791abd85f988154624 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f4c5cdb4d9e3166d48469cd64b6aa5f0459dd75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d73e93df65f620c1fb10863f815021761a3cb0b2fb09151323cacaa5ef5e815 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c62f773608cfe40f7752eaeabd6581ae386cb0f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6808a254b8a3c49fbff0b502c7e124203a94dc790dcf9bdfb2b4888c8fa800ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d11d264305199f48511fe86678a996a4fe566715 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd5237588c628cb7a37b21b86d9d16e064ed6550b5199afe6652dc755f42c615 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e49e9197f66ec5e86cb6dc54bc364f696de4ce16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd44a7c6a7e6f46cc65a7c1251b3404d72832769e8dd9c1291cc29738d2c2056 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5672ce0097f78c78fda9d79e32bd18415e81e35 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2964b68e726d745de4fc63e3f5cb272258fa8f3e74816e21212a71279704e0bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c37dba719cbbcafabff672472f0491c929ebc0ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:346b5575f2d6e5690ecf2727952373fd36a50cb78c2c1748858e9c956d64aff1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60677f6d55e33ed47e48d2e41089a64c16b4e272 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a960d8d88f00075cf44e0c78084a3d7a6ff49ac4bc01076dc983adb62a9b468 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeacf82c2e8760bc231f00b4eb5b7f9ce0c2b073 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:937786723576e49f9572ff676e44996757cc6a1e6a1d94d9155265d50a8e41fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c366d3dc62b03bc10b7eaf07f0472131778dd6aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f676c71500c99b7ba12d4adc90cd8dc38aa9917e703da092d6efbc807b4e0d98 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdcf6d1129a6a668355ca857be0964618c45a8ca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d36b5103610bab4e739cff9883f973d82bad3a42c09e939ae9b69e875a4e0317 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b193dfbe537cd7ad85eed26d17da6cfbf178093 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b824b32df0d7406d6f639af6ae3e26ab50bbc2360ff6ec11ca806de627a9c99c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5368f71814bb90afa291ae999f985b47a5a3fec9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:135c0707bfeda909ff9d04365f6583d586fa477f12e3937b9b5159e1910d6e05 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..120a526af284a190cdc0dc65951045bcc7be3cd8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d01dfb9d1bc153b1a4afd329c302340fdd187fd199b7d7fd7c4219837e65b8c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41e7ef1029f91d456df99dbeae52b3910cf2e2f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8815c07fb83d95e6f2d5f2a216febe28a3eb2010d17b7795a39e2978a2758029 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..281aabad830764ef9c24990c86700335b3e1182d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b705aebbd3205773366c7ae86743bb8832b73852665b570174cacefde70ea2a7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59153d8c91c442ea5c83b4e4c4eba01885bd00f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71ad753fd9b0db7f48a1a0d42cba138b16c7394b4e62458ef984dd7db26cc502 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b0b3d72b43163943f15b0593909ab38427859d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dce7e249577f60392819e127d43acf8ba99f7cad80338b6498bc7d38c4a1027 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6183a3f6a529354c475d5c47fe995e54ec88866b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbe110e5871587e32ba787bc5c4fe66ab9756211a7dafd8f64a991116e8048ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc397246fd8b3fc07c2d666f6cdba52add854d20 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89a7b6c8765d3b552a2827b5ee459f7676f2ed767b5e45581b63d4dbed748dcf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d2081c086bb98e34915b046e484f3042ba398e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eabf736e88891c70f455a408a85b436b6eb1a9b5fe8a1c954c336f301342ed86 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d433339294ff8612f1ddeae22e074f6c640c7db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d2e5d4584b38226cfcd909b2067598863473229d3d86ca9fb7f7f06b87267c0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3a75c62fe8124b50e6d902991372ea90c3d8641 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ecfe03ebc4d4d52d50367e22ea667a66936604b53f78ec451da101e73f6e58a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..538bc88909058799a610cd01712c86c9bcc0588b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f475e1501d1967568dd433e1cb76033e2c4f2cf6ca67ed421846be613a7d00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0bffee4d07206b43c3f278929bf36c60c001488 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b7829445bdb88235e65093acb722e8717d79fa52b29000ce0f90a35b982753d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27998c1cf74b392e52377c2eb82e31805ed5866b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543793b214548d6812ac5174c0648ada2ac8f371a85d304d9ab997dc51c80df4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee7ce5d93ae20147bc16cf39e32071a1403f476e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e292f7f7453a2d4089c84fefd3632edabf0ba9f8f0a39ce772cc67891b43410c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dca59cd280f7b1ec0cdacf9f385ec129edc6d41f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15c0dede68bae6f5833381d2522dce4e9141167a6b478e0a19f86531a500e071 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9299dc2c0775866e9ec3a890c060846b70b83f40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e407bf2ff1d9daa7c3c8ca1f96c83b0ace614b5634b8d25c16b877c6d79855 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1098a23a94b8b6c3651b2fab4e98d2f4c87005c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:442a127aaddc5ff88c7fff23baad04dd2996a5a17ff57fe19d0ec5ca0c5f45f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..800cf45b49ec88c90dc03678c73fb1eaa017de2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9808774ba40516e80043092cd970bdd04e5650b02c188eb24cb6038b20b2db7d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9de393519764cb93c767f3bb3cc2a5f91af77505 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f65b5f8955bf3fb8f3f724da5a23eca236dc21ab5eeaf70a3caecb6620fffc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..caac7755c1f0aee20d039881cf6dd7413a23db10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:132c65e46421db62575d682080611d00bb0bb9645fb5169121d79cb9ec82a8bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8ca85bd395988a75b26043acb2b86f0aa7960a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:031cafc0bbf61eadd6ac823b6154c641cb86519bc77054ce2f7eb2349df57c39 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28e2010cfcf963dd103baee59c8ca2da5f9f4cfe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5dfef5feee871042d1a2fc73195bd657fe5eb8172187e11e004377c2ee82f55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..610db5c47efc1a2c6c90b71389201cf2aa6c6ebe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cc59882a23b64643e2530f72c6df8c9d79cc0fc05fa15db17cdfe40283aaa5c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e32e450976b565c325ec5ba3f6185f35fd65ff4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6e0c2575d803759f14c0785623a205974cbd35019deea9d8e0cf86aa0732c7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24624b74c831f18d2781c4539cd5079a182f096e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df1ba70c13af3f1e5c4ec29d69b0112ffd98a384bc553c80f508a2faf24e1f53 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc63c721104013797b9610908772a2e9ea680a39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c978139932c5dc150127c31d4b0ee251a36611daf91d5a89746b52364de451f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c03496e4325106069294f97ee2d53978b6279e3b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d5399bfcb6ab5e65ff10de81b53f701f80b3dd2a1a47d4ef76ad85184b2db33 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6fd274ec7dff9adf23562c9e9ecb99d0dd417f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eba89208261f170616fbfe5440a0e36e2d131e6c06742ee7f8f43263819e4bb4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d77bd0e4a39c3ba283afd6de1f6396cb666dbfa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39b3697d767a8f762a79d37b58bebc6495c42b6f9d64f10b96341ec76feb10b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..164d670ea6c7f6d50c66998f54ddc50286e81d91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:501d62c9c2d32c6193020ef544799afc95d988ce564cf1c044c9fd3aba02183d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9de4b41ad78a397d80c96bd15b11571129a8808f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:067ae35a09218a0156e4ae6fdacc78e36a68c7cc8a177f7d1056047861f4dbc3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea521667b513a473c4640d4ebc5e0578236e2eb3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8e7a971ad3d713d9cf2dbc18385973b2253edcbb2edac1a8ef79e4f7d1a327 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45dd91286c372c4f52e36949a187ee563a861264 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:687156df4bb327ba8f7014e1b413c816410df93b664492f67e205040385f1348 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9029111908a510f8947f04778f15e2cd0d36eff9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69585ea999c3d8828cb4a11af721e91f139446dfe1cb97e6c0364a7382c0712e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bfca6ab6095f3be11a274f32884fc5fce13d32d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a0107048dd6a2a1761cbea3344991c4d1bda119e432c11030a87f6af2bf7d62 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eea836cbf1e4bcd407174a3daca60ca57538b63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60531c5785a67da95710595b2553f63184a6ec2f765bafb98da5a8a6f737aff7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af375875d67d761a57d8b675b18dcf1fdcfcf540 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f89490527ac0f1e5e23abf6e4940a1b8f38796fa8f51c60b69136ec1477b7825 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4107f312d0a753ddf89b3b372dceb879be2c6790 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7697e4e837f745b9e80211ce004d1c7de4bd073f47963715eb7b93d66b2da31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6d7c8291f287c5cc8c7f555282c56c85ee1c884 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13c65d5717fc1ca97459ebff46415b5bf61e2caeb5db5d03ef3938ecec00a869 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2853cfa6ba12caf55d7d6c5d3ba54d469901c33 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f662c4f3657da19ac6301235bc9ca66ca77a016d7e315bebe67c5b5d488e178a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81363c53eef8bf23979ddfe10659c5006b3aa82f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232c4197a3f2b42f79a0ae861ecbfd52bbc8a89e4b603195ff277d5c0bc194ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d99bcda6f66e2da9bc74da9840bd1819f1f2630 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39afa5f47cce557b86b1c85dd4730abbed06c339d1ee288b941784d8a4d90126 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..352ab85d563bd0b7aaebf85e438be144dd6a4255 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1431aecd28475e88d45b96d144dc1937473e28aa6d1cbad9e70f94077e40d56c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80383e3211ae1e47abac18f21d83a2340e76f960 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79310a85f508fb8ce77e342ced6d4c1d4d80c4d532bf43bb990690ff100249bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..162a672f16d904c0dc6617f0f07491cf72b3f2d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e901d2ba4de610b38ba64ed796bb691759d14d852ae913828b51870406396f7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b134481d494bf9eed9439c4eb1c57ab8d70206ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:221e010725864efc05b49ec18e3a454a434655647722cbbc8342d2b7cc209631 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee90f03b3f0c5ff054d424d5cd1fc9a6d9bd68f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0121c3ba4d34791ca53e669f4d8e21aa32949ae3a13e9b052dbde855e40666ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c697ca1b339314630c24ebb5fc02578c50a3c286 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cba8239c5b95e1b091fbde09d7ca60cc03e155136c1b0776238e6c4a22ca488 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b208a93a757a3eb607baae09a1ab0f48944661f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9077a7574e7cf72e627a5a2ece1907b26f4196737c34143a08b6893fa2791dee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b7d8fb34b5dee3eccc7cae932e437f3d33660db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b14597dfc2468068eda57c9193c00d176c999e2409d4dbece419994ef95fbf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09e33d7eab8fd53f0dee6f6511fb930a8d33b5f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1995af9bafb0f9e67816d11c30c2a6ff25dd973c6f9fb6922eb27a2a536cf6c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1884b330697bc878a7d4a298276685d1bbde10bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:291a966a77797d48c32d21c8f5f364e2322a3fd905e23447e4a9cc555167ca29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68f26d07af9ec508b7401aff2116b1e23c3e228c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2af04a054fcf434b07b057a5e877e5901ba4e2f2c929840b288556addcf5f489 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b6c0b3a43dedbecf3970e3b7e2f1ca263341939 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be1ceaa99ead6f3ed5a841acb6ea2a32b60691e8855f1bb0908b961ec3e9e3f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..181a94e19c16f032b6454aa3f20b29df31cd7d8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:867522c42f27ab2ae1cb34dfeb2873055b22f723c561f94534264357ab284098 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33d6b18cb13c96070064c41f293b8c5686d6ccbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37e80da78ace93ae133df6219a361cfe73f48d6cf04a2815982e306480da951d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34c8a7748cb7d41bcb599da05e3bf9f56246d35b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ad27a08000bb820c100c8050831de42858a7b6dd369b20e7054f18d6ace6f18 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee091ee82593b1bd07d8d8f687298c41bd81d012 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:947c8a276bb66e39a79d137a232fb1fe82bce7126af38fe157c63432be5dc206 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b61012b0bbd83a88b933a6a57bc7e0ba3a5c8f49 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ba654a2916b042aa55fc85e50a89d2e823be208cdb5d04ef1d939be707c3c66 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81354feef07e80550f09daeecc6c0f23be417049 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:389ac9b49f3852fe4084db1da0a93a0bbf3c922aff15dc4a9f33a258090f61a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..415ba4bdd4a61d32507eb3494f7635e6e6b3d290 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f88859662018ecba5b9c3f5395f59ee082f162a3c9d01660a9851add6f52f8f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..928fbd31b3e82165064114e9facc4955486c4a21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3b29f07fde0f35e1773363c0b703c00b66770213548bfda9b7b51a4947fe82d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6ad5208a6b635d18dfff2d8bcec627fb40ab959 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d691fbcd543cc47abe8935647391a73d4c0cf4ec44aac1f4a220f39d472aedb0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3724585a0889ca59bfe37b2b37a9e3a437958c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edf2abfdf1591845e94216a58355096a35e63a1f8d8c901b84d8e15f5944c13a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..244aeaa0e2770b1e3b7232cc51390872b8518f78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f474cf09929cc0d8aad15e62a38cedde4c2c6bc1df8fe74c7b8feb1a2250742b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1df71ea4cf527f747da34a0af32e13850aa369f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec74c1f94f1dc7258d13f516429becec32ec2ef1a2dab88a35d0366a61e1fa37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad799d78c71ebe7893ba8c46742585fc313d767 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19ce15fd76968a4b811d1e9061320d7bedb64273a1285e3e678e20424dabfcc2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..148a03f30427ede856fb04a2a52bd82c727d9499 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8f930bfbc031318ca213032495d35f2037e8f382987907b79b78d66e06e8c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6c8de17d76e85f48409d901a01f88be9896e31b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4546f44ae25e4c954a74cd745705706056f89a2e7fc794479eaf2aafa25a3354 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e465e6114909141af48d9a7f9e22d84a25314c7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a38380ee88a25f283e074734cf4a039cdb319908fc1ba59923a4699bc120d6c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a64dd120433e7b72d801e4af6420b8cfbeb7e04 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:313e61c2bf646607b5cd2d9ad421e99fc10353c89124a33cb1c49a31d562c91e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9dc43a327061ce5c10555d29729b040edfbdac5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:003354029f6c6a4f67303c9d6edcb1c7035295c054b947ff7316fa74956d333a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..666aa84a96020defd72436c81c95b75f51afbb52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af00463633794fd586d29718122f8243ab1eb6b98c8012d80914beade11a971 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a7621ea168f5494e389dbd645e9182fd0c114f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa7190b1305b9bd30f0b4b80e107b18a5c46e8b629c9a89ee384562c0ee072f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb2241821aab9db51ebeac0dd5d65e6e9a2f0bfb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54762fa8f8ad712ab175dcb2c569d8f9c33c4097d4bec1ee7f2219d4e5346310 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..faedca0447bc87d0cd55806afa5c956375e95498 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13f008cb229f823319a6bfe1a2d6134cec21c2d4c4f828deeed40052f0ed724b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..734479c9a1c75d694422891e6391fe1c0dd2a5ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:862768a5943f8b1ddc525b6c7ee740c5c90bd0824b37492a29dba85e8383fa1a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88a3a16a53fccdf16f7eba9d9dfd672c0b35f681 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a270eab3dc59efcffae0a14ed238edf08c8f2b7951a068cba62eb3abc4f944 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e15940148197736f0b61d907a5af742b26fed547 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cad12125432c3a829fc82040be07fa88fc47b0d887c2c3b51383b6ad28809fd9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38a97a747fcc1628118594ac1fffef8fef01139d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab1fa54a4884f12b715087365dbf09fe9e4d954b897d06e53e46a50e0af445cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a955310b73633abf3ff27dfcb99e29e8d2206ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd42f9bd46d00b1f7c5294bd68a904e0a29b8745591f1ddbc628f77a328391e1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bb4a4ba884808c8a1026e18a4eb172942875403 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7e215400ded9d80d7d65019de0e6037c3be2e0db6337b6a093b72aa2b06d214 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93eb5afc829954a6ec01f34f188afce837f600c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b815dc7f0937ffb330055fb5eac10b5971d19f420c6417cdb0ea0fc59ba4fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abb1d6a933e6f3e681e2a8aad9dae41df09f4ccc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9feb777894972fc6c6a11e9343ed2c3d21c2bbf71cf16a726a71a19853495803 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b331b8b72405a8536d8cce7ab74db19ae5d621d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f050fa14eeafa96983f37662a5a6d9c97e7dc9a4b05b8ed0f2321f1dd20bb51b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e56b500912c6b8649f38dd62ad59fd525b402de2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12f756fc7570befb571549b3ed28df107fa681e76e3132ff2a8a3cfe221d0b04 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8441087ec33c2adecf1e7935d70c468fe9e7d9ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba533ef6e964ad3d17e11ab9f920bba638453118ba19b632f372978e69b4599c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64e0ad3f8be4aa8960151d48d34fc3e517ceed67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4c8d29f6a5682efc494eb6c370a022a2faecb638ec9add2eeb1a4f301892511 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2b8498b79666c13c63b43f31be72dbb9e3d011d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df943c245c17f8f971078224e0f5bcfb93c7e651504fbecb709071f5fd0c25db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f964001ace29838acf2d2d18b08198de24a5115d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d26a7e64c2873e29b79c67e7c25ca3ddb6411af30d8f37a27ca9397dcd20452 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c55e8430855c9de81fca6c081f08eee7e16ca424 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68a7b91c8bcd547b4f93a3c3bc85a23cadedd4e54b3597c843b7b7fb38a1ef1d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24cf2b8b6fb9f3ccd3b522b94b22856a21f817bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef76d9f30b90718ead8eaf2e8af3a02a0ef298428fb71411aa1d6cd227a1fea2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..14f40b7e74f9a16ed8a083bb81cb862bd17662be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca646daec6652aec0a42cb121760d29577b78f06256ab25d0cd3fdc76c9863e +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbd6828c19ecd49893e1317c097baf72894015c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03066ecf2ddeca3e68015d5cb6f3a3e3c4defc0358bc404dc4db984203cd8afc +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..265d0a84315d5bb18f6316cf21cd28dd206ede4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e267b70cfb77f6354effb70f304f881a6a17dd8b6e83e571bd9238a7c60e60b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8176a26290efd7053f02c8904b7fb9d3d92bac07 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f59bccb295e5953a246d257d0129ab8c689c5f0eb4282cc266dd6da510bb41 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ba9de799266c116a2d6f141de7fd1c1ae569ada --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acfc85700c9abc01d0cabff318a7425cbb86eb1c943db5fda07a1cee99638aee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98f6403eb906e6a069880faa40437834a1481fec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44d973fa317878469ce0a51603d089b954cbe7d33abbd614b2cf06247a5dba71 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98f3c321017d74d56bd91962e034b80bb46100e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974cebe170fc459a0431a913b30507e9c2254193514b1a6e536dac996df006f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62f85e958d78d3247ed590ea74c002a2525b9336 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c41ba3f708ec2d451692daa599ee1f64b42fd06674d0982d900a56f9faa29a05 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c07f41eff505252bc967a363a2fecc560ece2c4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3bc3d98f475fbabdacd82cb4bfe165a2716d0d1ca6f19218df8b2fde236d38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..176d86c2cd00013a6cb2b4800d33e7f43e2cebe0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:891ddab33cd5ef8533f1525f173ec1df5d975067a4e7cbc8eb9759476a056433 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b14d353c5d475f7a06d1a39c257d5fe3cb0e5cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5d273b12ba2b249042967577f1be475ba1ae2a9d1494953b45368b0b08ebdf2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6396fcbf8ee641eddd8e07441966efc4389210c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1966b60d780f0538e8ea22cd3f1bcf5df8cd3c51f33680225b9fb2d013d5335c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13db5e471fa8a1fc8f89f3f986111e4c0101d1e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:219726b82b009d6d0385c2c480b255ceda79daa4268731920912f138b0416ce0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da8efee6396630b363f050c80dbec57028e87e0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b74b18489eba503f05e6614809644daa0090b71183d63c708fb1907bbe7eb99b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..308be3875afb8a88f84399b35cc88106d170ab33 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23529cc08e5d488ad37859e3b2d812b4ea9540ea54bc473a82ae6b38400ab938 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..509a9f1cda9d0435f1435d1136b8fa74b23b3b2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60775888d7bb6050b52f7d63dd8c432c906f0d9bc5559108478d8bc22151787f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec4418c073acb233d352abc729ec0f7dcdd83581 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:434d5819bc4a03667b2f65e73f14188afa8b4eb37a9edf0169ab74c635f16cc5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..784bd6baef42dbcfc22596c434e80a275cb5313e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d4cf08a8060bd2ed4cfaa29ccc31270ca39f22f5b2abaf8e4128318dfde4afa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74aaf8f9826b20c5f5c04ed2530c61d24a1abc68 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ea40870d26d5c1ae035fe67d55ac0b2889b4d8bbc6e62d42db048471008058 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ed6a30b47daa92a82d6b3148c8c69721bc394e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fd7dacd5e203699303f32e70f9c1cb579430ea06f65b4f714b6717d27bb16ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..72974b19e370196c32887564cd2dc79880932379 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dabcbb05eb50650642c27c40b5f3032d139b2aab69b9a2d75b57cc81ef0afdb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53ba2d39f23467c16b2918c861952c28fe95d993 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1fc0b2fe38f2f9988448d09850ea602d8c6772ccf599f749ed406aac843895b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dc41c97403fe0c33069aeb038a5ba7a2815e6ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3235a76093be71974fe50e237162c981b93f55a3a0b5520489f89ea7ea8df474 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ae8357f14e25a91cad8c6faa33e6a7279dbd80d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89614a58df82b980199ba0afa37c4299faa6c1feefd7bab9bd885fcbfa351c1d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30841e9f691ca495710dc68d99ca79c55e037742 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8227d2375a2cca45598e99ac880a38088a1d68834269210ea4ff39e0935a931 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f358d1eb5a896148199fd38a4386c49a39524108 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8071713284ef8582bd1bd78878ea3dd1aadca5e6016a2df525b713b317ad74eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85136b8d0bde9663fb3f1bbf946918e0e76c78f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6668186e9e2352cff2ec2e37c6cac812dc56c7e882091e341af92d9e4a59bd6a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b792ab0c34edd87e6e2c5ebb6177cca117e99d90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db1b76d01a3be873ba4dfdf208fa48a773c877e30dcfb1b9aaa953629ed9eead +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f48c3283b2cb9b8da047945d844a9462923021f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae30001e16f00b5ddf7aacc4d2c46c32296300ffbdd04daa283124ba63dd1456 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b94f038f8f48f7363eef1d3cbc1e4ca410549a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dab4e55569f9bc77963c57bb5537e3f5a9ce6d021067e5beea443dd9e4b2e089 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc62390ce30e422dda7feff679de6a2f8e7645d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41fbba9af113c1d6db1abd515da605023203d2db772846e3804de98ee302a297 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..209f9f90ed9ee05ce7723d720a8808d41050e7c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e700b347866a2ecdef4be99b85b308a5b25f635e2129038098c48fe26ddfc3a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..24031fea86433f7cb9cf4346d76747068050aebd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73be06667f6aca5fc8f138cdce6848fc38350196c9ed8c50a316fa977e793b52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37b7e4b5f8cc598282ae52cad26f5f9f166c07e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99b7b35b5c2b172978a5672442c81dff8077a9998cbcd13764253a4d5991f9a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..76b559532e45bdc00861827f80d629e8b46c73d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f65ca2c270ed649867a4e360ff06ddf952e6b3816415e7aeb881301b75c7f8ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e92696393cc47f79da2cfbb48e83140f05e3c8e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e058bbc8c48f9c8b68b0d81f6e5657b05cd2e04a2cf309ca19cb2446d9130164 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74276dfcf5d870e28f8015e3ca96bf41c5bb486b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a744fee296883cee99293cd9c3418b30e356cb9a2315fcd7f6bcd4752c8a952c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a252a2484987768aaf1957936fb26af6e5516f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:115afed3313203946c2e2d4211ea2c8a9e4cb7fd79baabe282aa5e27904480ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfbb3089a824b63f6e7cba1b80b4836abd743062 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8335fe49995f47e962f5230f10b9c64ff3a98c1b714c61ddb8634b940b5a6166 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7299b05d31806c40e09807914f33cab32180643d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:016328ea3b07fd99346f04fa17be1c0bf19ceb510420d0bd37c23f8070b28c24 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ce59ca9e1aecb14aee60f81922a8e96979a174b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea33a31d5af4c3364051e66afd00ea1210071c0f32bc1cbded9124b630a62313 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e9e3671535d446ee83c79357791710b11ca4462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:499f51553f851d22d7b576eb77f00175e2d2b7a44e1426aa8915a5b2a5a6060f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfb04926e8300f8024114fd2ba88bdc5adb01455 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef6dec61271b30d858181041a1804a3d95b13875697d8bbdf5d6eec2987eea1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff7eae8c1ab22e36cdf7d780c343fd7258e3c128 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e08bac91c599b700faec0b60f6a47d212c4dd145c58ba643b5a011c9aaac3e71 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..186183f026a7e75beb9babf78af471e4b601da40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:649576955437df6cc7e37cba53b6be44bf9732d799d4f3e2527325815879ee6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89402633ee1e4776868d6f4143f35d9dc970b63c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae3627c23dcc6ea4d2588e2b14815aaab2b355da6ead9390df0c97685461102 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6f4db25c17e4b3bed6ea92de20fba43abf4af1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c84f2b11e014fe49b574d1292af23f31a0afdf1a4f9426d9e77a0875c1e4fcd2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25bb9904773845f8dcb538a6196f2cbe732f1158 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9f31ac17a5d98b633f8fed5504f2d9547a10bf30feeaa6c9cb37b08722b680c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f548e6bcb6dd7b668ea1c891e36a612b8d4c111 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cfaade3dde7389db2f8ed1c18f1eaa6b4f5787af63f27d76e3343cb190296d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d77e721de2650f4544072458d15ec94e696d27e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5f9c041962d7f0a3a52716ded70c289b655377954ff54e374215dc0760ca213 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b47c181d27b2fabdd85371a012dafbbbe72f4569 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e298a87d1bfcc2587874941b0e35ca22e946756231f7eda51a450a14a9ad34ff +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3910bd2ffaa9d3adaf808919fce9744e23efb9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82b74b18a33bc7f2491073df1d50b0ce0aa96d1117909ba1f654aa10a2d3097c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d127be2ad924a93079d1d958902a943b37f203c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20674a4f04f08704139c027038f37c5de862c5d3d04a3f52ba6a5c5ef721261e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a85989c5fdfd7ee8f77884b5480eb135f17a822a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2d1dbd1c0b1f8156927628c573ab322f3d17e4ba4fca680ea18e60e9895c41a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d770ddd68046475f1d6aa5db6864ae88f9c06914 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2193742a842f82409536074267bd185fe14e1cf58b3000fd0ef367c8ec884c8b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c64ef5f84e1d6293926ae5ff96e89fd0f7f9d218 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40cddc54200976a09c7e3608a1cccb89ebdca46332d25322d876409ea7f027ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02e48b0e5622846d1133115bfc2bdb5ef77ed142 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d82c4e5f000716e5dd46b58c90aa363478910bba983d7aee43739e779f2bd8cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84e27bb86fb9e8c98bd8032f8e468d93aec2292d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc490244d6c2109abc7ed937774e53881af872e670e8d8eb8df603fe95412094 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fb1409c0a1ab426fcbe4e0e110dc5868f308d9e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cb0f397393220372f78515bdf3b78c9acd22f84d1f044e219cbdb3dbc54118b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fec029ebdbf1ec49c5b85697b65b9a933732c2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8303a644e3767ca83970e6356a536f7737cb4e789c74fccb24a1e67bf2cad4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f07ac3713a83859f767a9440380588fe59acfaf3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ac4f9b4e72c49868f0af4eb295b721a5a6fe44b1deae04fadd9cc1a025f439f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f38aac3a98ecbf7599c99abf086dc71f6c897241 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:737a451754ec0cf7ab1d41b35f82974a059b935628a7c12167dd001bc693542b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f6ae120fcda5bd0fd5deed3de56fd084d59b3db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3b1fd4aa8a6e3f12cecc7f92d1534825ca7f8744f085efd39a7cbd47396ccb4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fefa5c6087797bc601907345df4011ad8f0ed44f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99435f7a61de62ed04f4de9a341d5baa8e21a3aa87e398e3e04c088976684d0d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b68ca35920ff3d07d5415a0c6a0e3878a9d29a4b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43afd4bd72bbd53f2d66202a0dad5207eb28f09d201aba9d26dc68b867406842 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..019dbfab1710b52a6afdcb18a49ca62fa574bf64 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18622473ecaf4a5b37fc1d6d37fb8dc86fc28387a0d4f3f709714ed25fb662f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..831b1dca9e7d282d3873f676390096f5da84db5e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be1e21f0d9b91644595c5b1f8cd08e70bc3340e795134fa1c27f42bd26c4d2bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6452accce26312ff487610fd2c2b043f790c7305 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d731cc4c371fd6d6c623bce01aa7c816bed767ac2cd39d3e3561520420b02051 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb958ace5ed15e227a18373a3f2fcd788d05600e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b734f636d5f7642a8fce1bbf4bd470a75c9fada23ead8fde553aa1ccf0e47d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d440ea70cbee1690a553ddefbd1f7161c189693 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1948f93f42d341d2aeeeb8a7ad3ffca85f2b17e62d054b4dd2cce08f33bd4cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4e18a4a965256e4c6d3b03870dcb46cd4fc7e12 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0108722a4f3e246f0b8b6036bfd2b1083dbec38c40a7a713d7819d16acbfb68c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..459efd0c5c3ea064c988630258f9b8f3bcef9ce8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaf261749ccc6b5bc7a7b5b572ba9a46887d459023573cedc0590d0914348254 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6549dcb0c27f543f4a9c253f04564a720f06ffb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c0f489fe8b1e0e201b2f32478163a53166b92277e2d273a3759cf4bfdd2e168 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6389f79be8b11dbfed2886432060ed3468605604 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec6e5c29115d68562d284c0b2a87fefcb0c0c7259f2854f184915e14da746489 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..003f8063ccd5f08ba2489043c0f7e402bea1a4a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9c372edcc3329c9ee3134ce649e5c284074600ab2d5e6e29ebc0cd0c1ed540 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48c48accda3fdb1740423530b7cd259c502a0808 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d1f3de940c8e127db15fc6e5a42508685ebbf1bf00889894ee375adee5210b4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8682ff935fa8207d1699c9b0dbba3fb4397b6c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:759baea43da82b9f5834d59f1bf8fc7ac1f2623c4af89f4a5206d8d75c905dc7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96adc77c9dca8b46b8f0b11dbfa53ce39e0550dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6bfb14d34734852687f5359324ea583dca1c357b87f880da8f2caf466c3bcdf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23c53b13524b0815777d2118fca4cfe510abca59 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7cdf23ae621c7a0410c90f540f67204f16e948aac60bd9e24c4de6528c60b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80de19acf4c326c0bcb48d3732cd2f3277834a3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:717bd14d14bdce82e7e6b410322fb54c48adbbf041a6b0a00de200d004c3b8e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8a3fabb84c4fd60193bc4634ac498adbe56549f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1e3bc1ac984938ad57d9740353064d31d900a2f6b1e28ef21d2ab5cb8f2f60a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..836fd28b0935097f70195fe1dab5815c46df42c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a46546e7195101952bca088fe48475e4c7202f37b7a96cf6974d6f9e386014a0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b0336089537f73cd2a8e9685789910c61db9024 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c872607253f77374e2b07e7ac134d894cba138b35994b5d98007a2bca4c8a4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7131774a48c587539e055c1eacce086c93f8f967 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ec9a861f7f2eaa158788b90a5411560bc9f35a62bb93bf5bb6415617aeaf52b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..862514ea6b76e9cb2339742ea1d5369aaf13c68d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823e8d549038fb381bfac95b47f561a5fb7f6869ba1ae48acea8d734df4ef34b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a25449f593b57256a91cc1c63d17a1d962b7eccf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:329812f454b49984bc66211abcdc7a94268e929aa56d9e00c8cf3eb1042d0a61 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21f403fdb95054363c1d9b65f7c59b43535688ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:172c102da516357b79e82c635dec942297e3ab0abd2cbb7d398bc3a521502f44 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b87de7c69aabee06bd79d829db47c98bcb31fbec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5645951b510e6b8ddd5c528ed611b279d7397cf573a1c441286332c6f4b8a6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c688feff47d76ad8176530d409a8c994064fec9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80082fedfb590da256a8aaf57244ddae3115a4a996b95c1dcd891a6ea79e6658 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4c453d55e222eb9b0c57e9fad07fddb112abe27 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5bf2d1f258bd1174598df65938c35588fd968a0fbdb0ba456b3ea70771ce923 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eb6908b11ef1ddcbf1bea23ca9be4433a4ff1cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:876a0e014de92bf79d1db63bce30d13b34124d4a5276cb0fe05da5ad77d96ad6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db124f364d09914bff5340d276fafb06925564d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f540de68cbe4c71555d70a73ea2a75b352f7937800009b868a7f858eb1ff7bae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89240a726266972719cefe38d265bab0aeb0bb91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:998e2df3663b54939b67f99063b1749280dbfcae73139e9c457b53b4f3fb0f8f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0707dfd72e179cb76bf97de47beb5cb6b85c5fdc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4845cae1f9a2059e6ed29b98a3037a841db8387b36ede3303106fb3cbddb86a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4dd6fbf39e9a0ba3cb481c0dad1f8ede0f8a6ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f665f92343b8b50ac540bd2bf66c4c81e0d846715b28bc76209681d80a241abe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eda3af8cce979a24fab0c25f80f9cbc8ca7bdf84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:588cabcf2b7649acbd3a141cff72946b4c1f36b2f1a3986607b05fc2dc4b4743 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..94e48548e088d179e2105f6f86b66e58c82f4d7d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df6e27865036cabb67b330b8adb2c3ca8c049bc3bb2988e09d90c1976a9f658 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c71c2846f824a696ca6ff95b1d7558e29f5b4f4d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a4d95e848e42c973fc712b45f6f78595a86890b03d1b6b11c39dfe956715c6c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3698bedc7a4969f0d5290d8ac58a29317459c1c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c4a269857cf1abcd6c247f677837e26aab9cac5af4d6b3e10fa0f2c470b62f2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb02e67200a80ecb164bcb1f8ee45159e7b1d1f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e748ee372a772fc99daa5e5c5278626da4876071389641824e5cbaf027317a6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..617400c1636f92c61750097e5f6b7c3848a2333e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc5280580b9fde7fd3ea02a05ff0e973bd79abd7b63258550095e3a02cf15e6c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cdd4ce7678f0288fe986c4340110f670189dd04 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:720a9abece22ab06267a4baa3d852a7755619635ba0b889fe31721b425e8713d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcde879980a529581f32d3678bbafef58e7e6c1f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bd6f2e69d69a22f2edd100760a525e73d5867c9e720a03eb685bf8b44aed9ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c51138156592c141af6ecea3611e770a39c44c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a5402cba0ec28e15506e9ded3b8c3b680c0a647573e9adb9fd043550bdcffa4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11506fd50f5b51900877b049d972b6edf98cb870 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1f6698068d0f52b29885f74fbe81c08fa64cdf87f94f5d6b52765ec59f9f149 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d499d5a598ea8683701f7086bf8401446dfeef0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:355903a26e90cf1de1378cdc301fdb99b9c43440faae52519acc7567687e01d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc1804e1f80954f9c7f35ef002f916c4c085784 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7333473aac0dc587251e3af07b329b59b42b9de0835b94832bcdc789ed8ce9fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e342a6e9de7fa404933fc8529d7944cbf5f8cff8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba6aa31f116a600ac6370fd6bbdd9285fc17a54b2f80ed3d23784cf4e26bbada +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d66cb99c808ac91014daaf8b21db60cb68d1ea9e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d0fe91ec11fab665a8ac607073ad398785bc293134f0f8928e274446aeb918c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b93a6cc7cb8e654f29de2f07aadcb2c9fc0b641d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:297170797941a9a7b5237b5559453e58b6bc6aba3b503f1d5b517fc0356f0e7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..074df99601cd4d481e11f73dbea0b0261bc16cbf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af45b215e452ea73436185bb42a380620f84bd082e4a65cb1370f0178642a6c3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5997b7f4cd143788246cb766c38ce385a15782fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9947ca1f12ccd4e38ad23dc560d3a1bba6ddaf025b223bac43374a19e3f9010 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb0a6b545057764b7d2138b6b26f0ae6e58fd1f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c713b123353abee9545060f7a5737a7026c90647d6a019322c59380748817973 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c232065268f01c0d438af35be2d29807ffe20c67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2a13191a5b6bbeec876a9db31ec0de24f8a2687797a1a737c364bfb3b6b0e2d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..29e493ab2cd00c4677c2da0b0046039d181f452c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d2c0432651ede3f648ae27c06b86cd1aa8c6aa6e7b0cc7837e99eed2d33b9f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a1023534da626bd950d23d2e2673384763f7b71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e533eb9facb1b744aed1a18f132713339fae17a07c6478f09b6a93752b07620 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b07e905d3c53bc3af5a1196d9ca01d79a5543635 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc3d625246999d6f0fedb0170c96e5ab14fc785c0657863a413901ae6dcdd35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18e932cea7ed9d9a9c5327819c139b464ca61651 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e5743a79edb1168bb2ed8bf7cd2452cf42b635225b229371eb743b0e1433a0b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc9f5fdf3b52afcd76a5d78223dbaa5399e3f643 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:381af017464e340f5622a1c95700d538b67af1438b1514287b173f25a2f7761d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69356da7cbd2c29b77b74604ce8fc6ff42a14d42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6676c3887b4fdabf6635bf7c7e22d71dfd1d307a403c4bdc4bebbee88ec6396 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e24ad4fba4f6d9bb093bd1ece4c7a14aed82e8f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05dfb89fa392c28356afbefe25642a293c8359e4bf491c01c8c0d4331d1975db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f41ba9cb4a824e57fb6d8154b7516fda032109f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0013e5995c7fcb020f000f5edfd3dfc3e1a3925dde3fd8e1af36d3648bc1c0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7662c472c265d2d4df2f11dc96d648c432364ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6df7e745c7a26dd7a8f94ff210be5502cbf72a0b51f47e60c83c05c546541130 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b68b97f4fe14ef6def35d53b922787f9e1420366 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd94f022a454e6ed5cf6f2540c0ef55ef38d76a6c19f7e11b0f4463ca24618ca +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0355ec8b38f013428cb4caca70503260df601565 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ca9d73b8a900c7ffb1ae7560079a4937c89ffcd1e05fc9947dd0fbcefe5ae18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75d38f997520754c51bbf6baa49f70ef69d95094 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36a5fb0c5eff71af92117d22750ec095c2ccef4aab525d199706f222b70695b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..80b7046bf30efd23d65c8a5e0c435a4512a738d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690ce8af585d1db9a6f6cdf830a98188fa5ed2308ffd469c185f9327e8ee21d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e456769201f636f348873d9378e64661c2dfb06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:361c98b7e3d424534796516abb13ffda5f50bc0cf36bfa5f350558a59531a800 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4748e751adb62a0c69b082e9516f5681e6bb6d0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:593457f2c355cbd0d00098203076375aa0c84c1af47cc24e7537e0f61bd7f0a0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d3c4ac1279827237c8adc5a2092c2419bdb1b1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631ddec691f2bd95bb270aead70a072db281179fe922a79b8be7c637daec6594 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5f2315346854fdf44cd4f5e3bdae1539c6d4d71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4717bc9d91816eafd73c266b2626db92a12e4ec02dcfd6e7f3a3abbe3dd1414 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..914905cf949be349ba199e3eb96fd0fdbd513dae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:518525206959ceda362cdfae0b46bf8f043ac9ecd06eac91e72286d5626be8fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1b57eb458c52d6f7444720e2cd72d70b171d880 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52918b0974cf4d441080ee5135a0ec5a537b4108f47a4afc1883598b344754f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21148369f0c949e0a0bf70d4f8fc860f661bc6b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e88ebdee1c80cea6243769d012fcdb7ebbcded55c73f13a0297b74bea4f153ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a14b7e30d91412e963ed90eb542d2614aba12e1c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba5b66629adba71f392a8aafc0a0243230cd088691f2a8c077c73aae15fd2216 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe56d5bbbe8dbe11854acca72b924243f22b69b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c51b44acbb50a5246915ff9e8457b6ee9ad9c9654c13139e126df15697dc61f3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a15afa2a600f7e7c8b188cf992b2eec0de0d61af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a072fb1cfaac3260d63279f03a00500f9bb5beccfba380a62fc0ade752e8574d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..957f12061bac81fe71ff1be4d14d2a08a227c979 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35e1071eceabdfdaea8c540b599b5971a95a843f5adefd86c20ef57d3e6a3358 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..343e45f461eaa6ed4cb301a4e72ff04f8c15e172 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e893e522e2060ce1aa57bd77b2cc3b041d25222e222054d2a6944371a5da1173 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f06cef6813b6e975cb77a6c5c67dcd1a3067d79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01535eb81d5b82ff381b2c74357f67ecc9e5a8c926db39a1c677e7f4e4dc2dfa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d1c81366c180ede6e8ae95de582891739f15ae0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e6625c0c1faec52e84238771f4ccda5e657d7f57a54037ccbe10f34ac53eee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1db970e39316fa2a31d7a2459a33e54651ea4eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f127c8ff2cb89205e2c9a5a594c44896e18076c4c246fabdcd4fd29ab71bf2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86d2039bafb8cc6af1635b2bfd4ec03e0a5bb5db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aafdf241f0c9f7319e6aae559b7dc7aae27084707edc63389c95c9d661a398c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc92799e90fddff8ff3d3a1e07afe5e49248e441 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f20784d42bfa4c89bbbfb33bbd16360d6fb4409144287d7439973e635b1a7fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f511fc32054efef266ff3e02aef96fd8056f196 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f3f6457fd49dce958334ede8bbccf7fd710eec26a1d4c2eb7447fe1c5c9a6f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dce81b8946c96ce7c6191b3d48c1468750a9b775 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:029b93fe52fff148edf4d2ab68c8f555b866c1a33840ce3c5b984fcdec4505a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c669419fd2d38c748d0593d15065d2fc3f8ce514 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f053abb62363cdc6d2a26aa87e9b13d1a69ea3c720445ab296f374db5a9cbe7e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60916e5db89b09fec71947aa4cc8afa6183cd9c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a07fd4857f0084ce1add5483c1539a6682e268c31c8d58625b7ba7a786f3e5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bf81dc2b713e5b8e16fcb87e4db455ac8385fe8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa02eda11e114da23df01647e3cd234077921f096a745607e38385e75416bda9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0f7763ae54e392e3cd441168bb07bcfdca7cb3d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a3007920b9fa3b776c4908ad1e4f9a796072b808954cbe7844a9f99252615f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55e78378eb9411439cf1ba455b09c9a44e956d27 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8f7dd25e1c8433f4c291cbdc5c20d1a93570597d45c8731c3affc6039a9a5de +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d68dae874d57526b9f9f41b2f53e93c97aaa79b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea700e0e4664ab5f0dad356f18ef1444b50448297218b6dac6c1d42627d59025 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..153b4ca46f4273d4c2d4668bba334c2392c0b0b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5090ed7647b3e5d7ea0ae08482721daaf0ba303943187eb3d88cb06b097de2b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf50fc7fa2e9e6faac2fc048ea83f6c87e7425a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9923082bbf89806d06ed8eda9127fabdb79e9689d004622054f50ed8e6e54a82 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b669eec53bf84c321f0027d125cd7e063fd9c79f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aa75b1a1a6fbce6f14df2b5136f3a1701052443119919f8710876df3aa4515a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea080608a345d198872c8e67641f5d274ec089bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c559c6ebc6c05dccffdddb87df4f5a624a028465ec704219e7fe971774764bd3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a85ebd3423c632a47cc26cf7e07ebb87c45e1e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ca6b50ce1a011ca3f59c0f899ee16a3fb1d60995627623530677f9b3302b87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63a097f4bda31e85a203e26f61bb0acb83f453d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce21dadaceb0cb51d81eaa72acf4ba6b84ca0527318c9d96cb0911e9312197c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f930a5c4f3af73c9bc1b9eed302a3f11fdce44c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7759a73bfb878b9ef801bed65833c3b9dfdcb6c3545c893277aef4e82129b67 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f496b923e9a3c5cd348864d5f5682ee5222f7fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b704495bd60a4eaacd1c9af35258f9924d883a00d81bb68ec4cdec934d046f27 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7540ac6d905b0c877de2c60fabde9a3d6d666b1a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c08b9fbd7132566983d38c633e42a6e2327df51d4abe1b62a37c3346791c2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1f829fe544c10c3590832dd0878da27da5547ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4211f49c0323176efcdfd16c50d12531b4b8ec07f0d59e59f39df6bf579a3419 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8b201deb563916d22232b7a017d8a60ef5b610 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:488955d9de124f0c7c11607904a9f51e169b0ba86e4ad1ac9e875b9cc2e42bbf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b3671c2ace37d9e1fe8e15adaff07cc60d67ba1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c165d94fb369d1daa54ffe93cf07e70aabcf3399791df7a39d088dcbbfe1e175 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..367a5ad080e9ff9d4a1e50b82f0793a308b4dd2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0455bb9edad8017e56505cd4e665158ec858984d842ef515eef717fc66f2c72 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64bd20256642b717bbd7470d8e8741caf37f4f4b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe62cdea62e99bfe8b21aa4f18805327ede3994652b4c2cf72a071288011e5bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9762e66f45397bc518d5d29fbe57116d45b43619 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308181bd675f5fe07c6ccab24a0e69d0a2c8ff006f99989cc60f3d00bda94573 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..965b2a03b34bd00bc78f499d6e4c09e2ead94cac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c67d9f07e853fa4f3e432c2012466be0c776e082eba7c120dca3b92c65ddc52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bba6a752fdc716ce305c9995d0f122f0d3b1f618 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e04ba9af3e72801659090380c5924dab5889d7dfb6327559b69550cc2d0079cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d2052f3aa8cf9e8816b88e153d00d8c6f07ba82 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bac41726aaca3e7fd0c0e5d06c0de15c944cec57debf4c3291a6d1d395ac897f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfacc11c46483f94e7cf51d2c4d2847c638ca5d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ddfa3987569180e34cb445cccc7ac3621e9871793a57cfc28ed75333514f97b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab3d39783dc95dfc0c2dd479d8ca192dcc325e6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d74e5814a8068b6a19bc3ec97d5df38957f209a99f9635874238b343ca44069 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e132281854defc9282b32bf675aaaa170ed2b6f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee23110b20070f20e0b5bb3afd9ef3592e33925c0d1ce3aa0ffef47bbc5f9eab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70b430208f552defa8d787cd8e73cece392acb9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c371067190761aab30ff462df60b8a9a0afc882d835fca7a80bd0074ab9194d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0676172c0c3cbd98a7bd019dd055253cfd24d09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928119b90909afd4ca336b38035fb68c327d4f59500be3316af085dd27fd9094 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb383b3b07a0b05d59884c6ecd0f400b73835313 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe870f339438c73724621a9c57b77846042217dd0c02baead1025e37358970d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b1a9c090124c0c78284290d300e4f257f621dbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea6018b8a6d6508e1550455afa23c9d69ffba4d9eb9e0bd97717ba907051174a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae09daa0ffec17e425aff9e9cc01e62ef1468c11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb826aa57d4d18ec0bd55d9d07617db3c073d1ba29696408be1f5b116d37d655 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8da6d63e4e4598afad1bc59588588ab1a62686d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b7884fe15cf066fd2bd2f8c99010cf1e57da14409ba4a701a4e535821451be3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca3839aa05d759213f4075be2d2cba18a598c95a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15516dcea71f80fd4107a64e3ebcfd3d39d1d428441c1022cb204c838a62fba2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7124d38a97acec93088941569758cfdacbfedbe5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c63875104eea59d5d60d858a9ae94d09ca9a7a05238795fc4cd05152c44c46eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f82281fb5f33fafbe6d748ade68a8ffde0858bef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06442e66c4b267e5e37977b20b453700c318cd8fa948b759ed5410ec1fd1c283 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1017042f8415644206e2dd00855c76bca797c171 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9b65af414214440325856989e4ad83e0e3211fd00fe93df310a7c4293716f74 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15ae0812ae5d6cbb20b5f6a5e053d17b14531dbe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ee5bb35ba2b9c95ea651cdb0f0cf526a482cc9e52509155f95c8563a1e33b3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c420d0a93593804b97ccdb9533662bc925b084e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb65432838e633eac119d370c981f3b764962c2ecf89ae328a2b1d9acf93a58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9da6274b36c14545aabf1ab55279c7b0fa4ee99a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba3701dba123c6a5f1bea361e14527b52d4e49c45ff5ac41eee7499e6edbe13c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e78ff61212cbbbff070f44dded0479257d6108af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98494b92104ce907029b543e1f81ba43d35ff6868fc1cc87720e7eb35eda1929 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dddfff4d7f1567c07c948b176605fb82338440b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39480f8858dbe5c1adccc2f3dfc9741e9cf3750b5b4de70363d3861fb770059a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f95dc6350f23a12caa19cdd9c5f50260a4a89dfc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a87455126985e606b898b5273d6dabefe42d833a777a2646cee50533d445b8b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f00f104972c31588e607413956e042cfa661fb15 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a657b5dae2d95381a657f5e180ed8079d6fd800e3b5e812d606fb5d8be54d533 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e4345e3de2fb466286adde3df3450180595e673 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64cafc70a83fe9e02f3a19ff155106a96af0ac020e95aa2c996745030eee461d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee5d0e36f739ac67adb6d5ecd3e735010e865ae6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4178139b28def5fbd3a81fa08b5c13b6981b0565fb031d09c329e032a559ea1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b15aeb9c5abb6c6ce60a3e1ee4748d378685863 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25d161b6a7f856c6c9b738a61c31a40c42002aed9a26e212ca984fccde47d08e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4a902725f18c9107477ccce335f75bf7c710b27 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaf21890032c48ba5aa0a433c50a3c58bfddfae84c9853522e6da91832100db2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..035721f67eea280ca9b59303f9aa4e4ceb12c85c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee5138dd07f2c43c9e26fee51c3119d79b578db0449b3b0014dc7d912979abd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3799c2e499c3296eeefd096b82128245721d5149 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3daa68e39bb495030a814a16a65a0eaa5e518fcd72832784a9468849df773957 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c2b184e7211dd7170d3c7b851632634a3870b24 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3d15283ce94dcb4dea29e519eb738cb2aa9eab068ada6ac4bd38f9f12b2f2ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28cd7d1d310b185e253522ad947cc17065aca86f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a48e85077c123ff60be7f7c192d40ad58a30c1ad7d01a874e851d5b893d4df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5d591abec0a30e1b589846e75d3df10bd7ab0d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:216a850151217a8f5512acaadd8b1fdce17b793557f64bffe331d97a084f67ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdf3f3a878e98f970d70657a097a1c6ae7b42cbf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b958fcc971d21e67c679cd14e9eaee7dc7f757d1f4df471ac55836b2fb4ab115 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a679995197cae6ce2aaaceea86ef13cd4bcf92e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8410e5464d8e0bbcb22d92aecc46742e7638ddc4789f9efc24e1612ac4e786f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb4c4842b1199f1d4136ed116166e8f2b831ac80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6704069d965134a40c806372e796d51ee8335b71a64d185f1c9c9fe96de6f7eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7f381bd60009f4b13852bbc2fa70c8cad733285 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b3b5d48b214186d7d30ad6de19e83c97567fc36fc6f75519f0797b5317b328b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f56f0a35cc91f30496ac8041623fca75f3fda3c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:105d44ea8fd5543eaaefdb5713ea8169ce9cf08642557c0d759390b1b1f092e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eab953e38905c5ff1304294043ea208c0193d1af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:946b57629ca029b8a940acdfe959ad23edb4a7345e78eadde8389326a958a603 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d417b1feb1beb784acb836c8111149ad737c2ace --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f7290393e2deceefb54740ce8266501cdf9364e98f9d26b6453b5d2b64e2a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cc47368bf4732f48042282c56ee7d98c34b2867 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ddeefe7a001348c00fcd9df1cf95b077a21853443a35fd7805a64b4556f555f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4413c789c4c8f2b9d5679135d8addc17afcc9d61 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9ecedd437585441cb7acc9b666217631ed5e70cf2b06a47b6c0302a37a1c3e7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fe1dffa676782b7a81ca75ed925de3ecb027432 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31237719247c1f41d2dbf39b90380973c49d91ccdc87cb90c241bc53f58a949d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f3cec2bad62edc1b1ed900ae4cc536b1e870800 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:465fa27e240ce03a5e3f7255ddf9838ad2a19dce5ab7a5a5d4428330c3c659ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6126debed6ade0ada754ee79761561d2ec4bbb95 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99867648e40bd0bb1b439afeb219acebb1a4b5d2803c1e9f7ea7db861b9fa91d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0eddcfd5cb2bfbe519460deed577f23c329e5bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb6cfd8712186e79973fa0ffae8ed887fbfd55cfe28546aba40dc1683d46e1ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f413d857c428c322db21917b0712da6655ecb90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e3c365c6a01a109d418d6c8710cd3d91762c6698afba3b992e6b8682c6b6cb6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36c283b243f84e8d09a5af7f38595b3a9cec955e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11db5ae55f306e15d6a36620bcef1bf548ad690260f2b2af2b0989aa9283462 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e2326350a38811a8059eb4573d362a547412b04 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a4eff6d1ff30821fc27ff0eeb2e24f30b8361d1ba0b883b7d1d2ecbb4762630 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bf6227b7366be753a0f3e972e5120613feb47e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0b219067c0c189d6e7f0473526d55dcf9df9e380a033dfcd67d5ce536f6a588 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1307cc6936c36fb90fc150a64355baec828ac3fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a92353c6b13a5af0c8b576eae7220675d236ee795fd7501f7e4ea089b0d0fa1d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..baab879bcb3e017d9b19886c4965292d27cc3dc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97a4cb51fff23a8b428f6f3867b96657c9863c81166b0744ff6cda03a9694b88 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8042b9332daada1a1e9ba0f3b4efea6f74906b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d9653b4536b554a442025bae1f49ed709ecd797e256971b007db977e8c38bef +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c6a8e58b8a3fe5f367a21fa32b95516a97c1505 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:036251989d95333d84f66d4e2a1ff91e33d84d630e548b4a493d5d0add96a464 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d198195e7a77fcf10bf481138eb5a50ccfdf568 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16da184baaf596c4d282bdb0d3df1bdc21d9b847d974e41c37a4418cc16f0b3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7df01074a431b2b256d2c0872faae8f75b58ac30 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:861838f45db232ea528f247f1f0b2500d91c453134b9443b7cc14be33d60d3f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32800fcca93c4a8720d87adc43f694425ac2d1e0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c198e53798226fc9c09a7b7630f1178c0479b727c5d487f1d40fed23e244af0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae30fd159fb24e9eb7988c54d3196fbe3e88edd4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fe848ae5fc7b2f9418343c38718a453736cf4408fb72644f6153fc4d2b6a22 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8f3c3ab9c230bbd4002be42cd214c441fbbf7ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:def661af1216f023c1c217792da36f1be8bf1340d64ae5aa4bb32d05c60c2864 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..880e99de4921b890da150cd91d5e61e62ae0aea6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a878ef60f77aac8d0bf356d0a7f858fd6e3c1981d597798156483edd5ed4ec85 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f20c6a397211abbdaf9264b0d3854dff3379d0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a7dfb94d582368977f4989e28afad8b87a7af19237357ad68420a7ab70aee38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88e32627b614f5b573f4d72f51e7ac079d470e79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:554e1da7ec5a0fb13a4ef1862bcb712060053c3994b8fc32e6adc8774a1089ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9134674d4c2eafa4e8f791732b2181ad1cda43d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d213c96ba1ac267da485e5435b0de0f97bc3ad954c3c006f632a3aa597a36bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bdeb5cafc0bf4554ecb2e30bf80b129ec4f056e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36f40428566483283cc6600a247d812a8a2de07557de2d94eeb8b79b74ae6b7b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b43028b9872b5289b9ff80c1a99e82dad3fe85 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1734c2a11ce3b6a191ccfca764caba0db56218ab26e1cda3ec4fec1d815dce41 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85a95147755e2eaa72c17fb2852bdc64e2b18afd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe7db113c22f2aa0d5bf13eac8c917d413cbea83b2d7ab567c731f8f5ffbfec +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ac13f705d960390cfa24f40a0edd83d2fe2bb4d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8201e946c17292a1ca2ae59a93a975880051d646ce6a9821d70705cdd528210 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2031e2950444455086bcd6dfb7db1a1d84239a8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f48d2b6e1fb2bbd543e36239b872a0d64ef60d1fb924bb8cad40f1fa1f318d13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8692444afc3470be1e59d74fb0de3878e78ff4bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ff81766b82efba1927597b6bb668de7567931cb42073155f1bcaa78946e09e8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3386578852692f76c3df4f19e0c031b7c31eaef4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64798950549799afc589a6a5148f4f1beaab495badefe66b858dff7900f75a25 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d227ed9ebc4711b9e1c4adf3309676ed8414ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8619902d243e121907965048e4592b3afabc9af3627002edbdc7680cf276f80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a16182295264ec4656afe0fc49c0356d0f0fde8f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f8a3873a561f568aa49f7003ff361faa7069d04b76125d9ae84d52dca728dc2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31c4215ce88aac3fcd28b73ce8ee339a5a011264 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d08a820f3b2c3e62f2ab529602170844e8a9370f6fb639812d45d1cdcc7e977 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcfd19417454855026fb730b0ce070947994ced7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f046fd83070a624fbf6e95fef2d6041e9d48355fac75ada7fca30173428f310f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f8957a66543c1e71ce929877ae1e080ac4c22c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b48f6c140f565b5c53a1ecf1d694fce8a9bedd7eac20cd8d24d9662854a5126 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf301ea38e0a09ac7f7ca6dc2b7abc6916ff7f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb6f98bba78e2ff5900ebec0ef9df7fbef2dfd88014df22460933c5bcc271c90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d945bba0abc93739c0752b1100047c769cd29b7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a88a96ad81de10544e5f5f139dd9106556b25e9753b2be4b81d4d1748addf1d0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb4326c70781190763005e5256e745f0cdb0d130 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f8b52fb4e27c3b7b63f8771767dce6121bd95ab7f43c05ee6c5ee9f176075f8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf32cc63234f6e42ede64c08a03e3deb2f920664 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4631ba4fe0b1e52b94d84f3b3fb5757451bd702496c5959a5039ce9b706d4a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7c9fa02cec68a61d912d22eef318c0f3f88bb00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:708c70c8172ee2e93ff5c9f1b3a068153f606b6763fc8c03207d5c1e74397af6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5197b6b078b87bd48ad3f8d7aa4a375ab4934e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce4064a3c067c511da9346f983ef302a205dbe7011b7c7b2fce69cbaf18a1e15 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..522a392da1a62ed319b5e0a4d87121db6af57c7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cf89c9deb5b3ac133ae1646cb5b392a51ba3f59f412b01e764b2da3f093192f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f66ff4fdb7f2c4d65a4f77f12c72e3960d3565f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e6526e1375f388e756fdd6de341221f21751dd3d67896053fecf66232317872 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f45522d0055699d8db81e4ba79abc993086450eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac4e46e451a91805e8bb0c994d9fe1b413459406ddec7f037eecfa96b11d5de +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb09aa8ea1e29d4e84100b42a81785fe3efef7ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08dc9ebceebe5360ae516e0c74e1c29724f390e9ce51385b2ce1b250fa75da3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51636a66333ca5ac4efa2eeab8b710023230a43c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02495b4760356d14639789520fdca89f6f1e952178e533e8449c1f95130f05ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a98cc77a186bec3705a5bd191685f361bb679c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bf3f14854af4fa694005b6aad876946895553b27639398bfe5f3c24aa7f663a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03f94717b8b14fa3feb946479a5436208d286d57 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2d311e7c5b846a9e932d4387cc3cdbd1a3ae24319dafffcf031645872ac6197 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..afa9efb05f6475fe6c929fd88ad194b4b0676aba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e5252edfc0412b882830255f696a2e3611c992b797071b8de538eb4feebee6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6731dd106a99eeaf0964b2f367e3c510c3e092a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2961dbd5e0ba83f5fc6e6d390c17c17b7875327d2608dcaaf1e326a361e4a6fc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..129e20dcd0c8971238dbd7caa25b3c0e583a522e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18bb1ba625de49b2c40d3cc95732d2cffd4f88caa07bf06f30b18e48e4084435 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b847b36375d03b2eda46dec08b390a4ab4bda8b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83c678497a312f91ddd43c2539808bbdc65a24077fac6b3813a45e8a264dbe96 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28cd1004b6eaf08436aa346360c60d2833feb9c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df2d105afb84d1d559c6295fa8082f8f11af8fd679076a510fd60a3285e84889 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92ca13be4df48c3f3a47fb55998b43ed6b8467f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60734e74122a6fee695a7e683eaa3d3f36f16baa5fdee50387e60d8355754ab7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec6d9e9ab48671faa5be55caa4ea87a396347cb8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db8177e30aaaa8efff888f404648546f0ff9bbe0798b7f55fc526b85d27a408 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78d08a6942e167ebb9cd8b562ba19e4b157f064f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d816455066d3ae9c08a2e49c697d61fff1ce590e34dac5fd80d0ddef9ac72d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e89804c841fb038d344c8658e423c176d0d729e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c515406488a4aae712d74c339bfd5bac3736db683d0d643b25a30b2f574a958f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..927f89b231b103fe5409176cbb89c302a55f6245 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c657d38b81fb181c0346778bd27f82e65c1aa16d624774334f4096fb0901081 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6308d92f58470ed1a766843b5eea2dce00a8dcd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8e16582bb12ebdee01268670ba34e3249b7fa0dd94fb1eb669f73d82ba33525 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e38fec25e6b5e508564692fb40335b9bbed59124 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c7b286dc3902a9ae3b398e34ab4f9bc2223964c3fc69fd8436c060dd2a5f06 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbd2bcf627c3c91dae8a2648ec051956ad141b02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87df5c0208434989e562156d04920bcac5579bf8f8fceacee0d465bdaf6d78c7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45071e21142bbbe718d1b1fcfbd9b81537a70931 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ca4c8491c3574df9324e02220df3c6516c3572b846725533ac28e8a68732b16 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4724afd7e5404adf7e518834fbcee98ad46f719 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:566b4efa7b7fb9f83a225059bdb76c8a17f60a3c253ab19b7bf66ba089da67df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4338a9a5793c4722396467398e062dac76a721f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65f2c7e381dcca0410c2a7aa6eb3513e29a8b3b970bdeeb03b9dfd3354dbc30e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..469fb424f64281d2cefd7a6f5a39d9831abe57bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37a4a7cc3fdf5155d4e9aba8c9190e65cbf15cb72b2341b05725a830f508dae5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7c2a40ead8f56c734fd44b9ae4a992223cdc5b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c2baf46dd4d20e187c4578582e73288d130f8b846b2ecd8961c9d77444c26f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca89402c696beb73b04428a1e530310ef027f829 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab66f3f5325ddf2d6d11c0ca83f80e9649551f76697ba79baa3df6cd1ae341b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..085aa23fd38f5084eb79ebf5f6e9ee3bfd112f32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e7fd75fc2a91c5d8b2e38b1ce11a72647eb82ce6890b69db98466849cb4c787 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..641337ef5b4ad0df83da6546a623e4a945c9ce0e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37273dec4755d22695a2b72a05a9bc73c4f41e91bba8b22e0868529fc5812204 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e471b601948c608e3346933b4f05921c96f7e8e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa5114116418d760ef7c1460e4c089b3a150fb5859e232425fe8708a3807d6fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5006084d39a537800a708f1d710a2da7ef38c1aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f53970b04540f3f78686b34fe517dc33d53ab1fe9f8bd9a9f383cc4bbe8719f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3232c6e8cf23cae32ed7e112726b31b3b5db8455 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3fb6d2a9e80cbd73bcb8231f03015c768b82c586c663bc294d8683806aec4f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..05455ec9f42b72f331a75f44247996bbb149fdf8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6744871474ccbba4d5d031d6b7c708c26d00d08157681d76b07a87bd22a82af7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b88feaa4c91bad7d4209ea090c70d337ef426df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b19d54193c90d7e2cd1af9f2d15600184443a84da4f47549b78c1a0a810e6f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a743d8ff0f8e9878de1f419d2499270df0c78e6e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f00c906397060c34fa84ba93d51c42ab8703e6ef667989e564554878e3f60a26 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8ef89fe480bce6f9d57e3d93021a32fb4d6faa6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:936d3cebd98bde8f0d29f710cbba5baf4fb134e8857288ad83e7732949e4f91d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0398a054327807201d859f1c40beed95586210ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f9e7403179b89e5e359edd2021131e723b82a6f9d589eea5a95e383a9fb842 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb33661afabc85e5bc245b76c4bd370f35f59f6d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d59a5151c4cbdccd032b95d500bd2f6d8d0136f3dd490d4ea05de9efff9f8d7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31fa02dba600720869ffd18bb17327167e85ac61 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2800484111cc863bb6da5fc7a4228bfaf2f8d49d53389a29fe662c4168a884d6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f689df46b2b90c4b365bf8f3979fbe324ae025e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56c035b99ddd132319d6f3425aec8434842cd5deaa7a6f3e1bc11cee2c9045eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..befcd461640c50998af8a67fc35a99fad54475df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf09b1e4f363ee32586125d1e27bcd1b3a67f874d3934f7ab9aa31aa8e5f855 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01378ef4a77a1c105a16f7697d2589c391cfedef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a30c111eb49d91716a08308c731ac0ee08ad82715bfad8272833828c9734737b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..649567a29e2f1a1a56b199576c0d29a71ada5533 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe49830d7dc2bcbd6c3a4a080bd9634a19562e2ef0a15f9bd8235fa2d39cac0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff5cde6ed099b7266cf42c519fbe27148869d6c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7095dc310d5478e1452b0864f5609a351d60e78e51ddf8dc39e906cc0055f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a654624a8400040582ad2743d50c779740f1ba9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7432ddff1f5a82f020d700abd9ca339fea5e8c1286fe0eb19e461f59fdcc5929 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d60493211c9914b0b26eb1ab0baf7fe5775cc99a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e53e350a5107391b7a0dd6d7439fde382d3a0e9bcf8a1d34b3012c6ce3c544ee +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9157c8d7b106e5c3f56904adea50cef6a2a4e247 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:786db798f9552c71503308b21a9c45dab3e959bd955b1c570a9381bbf0d0b40f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cca87fba0867684ae8fa93af09221c12573fe7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a199b8a83e931c2ef5bfbd2ef3a1f7ce208541374e921034d69af534ba80e8cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb6e781083ae18677e2bcf3ea0759556f4f35cca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0036cd4bcc9e135024ceee78fb545d4dc7488ab77bc0a30248e4f483edd4e082 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a669c30d9f3fafe41e0ab64ef67336c53506bbf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1acec06d25232b50887ac58afaec68171c83f63434bfec54e555fb41affa4c5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..407c7e44f948fc04bc7a0d9a6e2d6f40da3212d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b242db93415f83e2d9a0d7eee93da1f0add4e0071d1af57a7b6dee58384ae76 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4f11993a5d3ef15b473eb596af6571344af59c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5048741c655c4aff1c8618d9bd3d5699a9b7054942d80248b20cc75647b07bfc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b51d28b77f0842a0a66fb7ae3313c9178a14cf7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af8283eebe9b577e3f4c1e75a35ed881f5938c5be689a919a4c0d4210382ed2c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e192b433c1fc4098038757d56ef0127b993eb370 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e56b21d1643e9f4ab388cb1791d5576003ad187f9899476f9336f6ba046edb8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7747655d61f93e16f60044c56568155b39bc944d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b554e6c341e832a6f20970117ca55807ed4b31c1afab917883e8da3744671825 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10d1b4e530a76c4741867738b0519ca11355fd9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d957cff63e94d25cd7bc167dbbfc73aaafe8105db039bc8d0ef500669df577f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..444a0430de35ca114fa95c7670ae18dc25918a63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486762c038d4f9db971c7790b67d074999a32fddf7bc94bafbe3fa395b5dd4c3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c026703688dc6b003393f78a88fbfd5d2dc2b5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b932abe2fba579e4fa21109aa1535fe72f171ea8143c4e46d772a779f96d80e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b8144c97ba5352d847ed240eb831e0d93d7cf1b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077eb2f19e8da519f706bae95e96de1015f66e3163478ea1de974d44c9c27cd1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e1edcb561c8669990fdcee9234cb078dd5d1c80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae5b8f3dd01546ae442010c0783bfaee9b41fdf390dda76f3786bfbdca0efc60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d217d646267f0a84339a77c37d18ba7ecdc58e11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f748fe688cd3862fa07ebc5d3e7c8529d251ee683cdc73110b8c23618b50ae8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12e93b5aaa7de04040741a4d74eb3cece33e5712 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368e938ee8783e5c6b295b9e83db24de94c607e20baf32a5f8495178395bb93f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..647c2b3974399d5ab1e0f57d0007a7893276a230 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:214cb714d8926f2c9dad867a59a019da673baf64e5f2d91a2fdeb8a49c22b49d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1707abce168382d5a6e958629fb03cac56c6c97 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94087912977bb1310dfec9dcffa8e47238e7360893ae6b07a8c13502b37d3002 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a5bdab040798c173d8720a829fde3d8dcc100f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7637bf51c03186607ff98fe86926102b03e2fd73d574a997e9e5522411c247a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc106e5d3965c61533a6263bf48b2de7554d8643 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d3a822bfcebdcf1f8d08a3edde71119285c013cbbd4e0b1f8e4395a38c055be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77e046032e0eebaf3e965182fbe15ef8c66932d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edd90285f551d9d035384e8442eaaa63102f4ab5bc6c238244ff48ef3f571096 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34cd3e99060bd83c5099cbc1a49afae3771e47cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:132f3bdb06eaa1de03bd3b3724f882d25c8aa250afee478f894bd9aa613b0b22 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac4bd98f811396b603b2c7235572177a1ae7c196 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f08ab2e7b79aa53ac9fd0b662e8f3cd9487addd69d245fd7a3300e330358136 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53098abe55319418de5c83c1bd910b498ee3a7e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc5ef25af9fb3252f31fe09fb2874802cd84f3976480e544a9938f8ca033b40 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..510d3be398477b48ffeaaca8525b546c335364e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e29b3e4307afbc37c45e6633ed2cf97b28107ca45dc32be7dbf0d2df9ff8ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a9f6efd50d8131303970949cf44dad0a828caef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76873e049b761e4454c5c57fe35f1a58b9384396bf298d46726c8011014055fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8eebc1f43c4d3891e0f65913f38f4025df57c5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:038e9dd486208debad1248ac6483973e006c7947df601639e42aecbf019b10cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..247ac2e4990e6debe481cf9928a041a6834bcccd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90c2a5ecae34b69a086f488465440a42853ed868c02a418bbe3e13c75e01e90d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..707112cff0f97927b85fd4dc2a24abd24907155f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ef3fe3a127f2cefbaf300d08da78989b37f3339d06119449a7a95744368b1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7b5ac702845ec93ac3949097833c74f93418b34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84cd32fc316ae6528b77ac32b4ec3b8d44ffd227c56ced5efd6bad618795ac78 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a67e8e5a312517a602defca174d7d231e76f2f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ee2522c14db6aa99afc289057afaae43b43fb6b97ef3051c8b7858087cbd5c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2091f6bdeef69e76b2a573bd3dc4710cd478a930 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4dcd4a5788668cbaf08d56d586af61bc4c45212cddd516a8091eaed19c2f452 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9c8e997845580f34f1b1c64854a6ab3ea4213aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a81bed032a4fdd2087a04517ecda30218762846d11450bca3dfa495870a81d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..adf64e5c5b664a67036e6768d6502e7cebec0bb8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:726f18ee07728285e277803e619d2e41398c0477448d19f57943223f4a007f39 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..239c61fc72cecb5d4b6912534524445e7de04575 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:250a77dec05b34a9c164c3a9fad5a3905291624e3dfcaaf417c2a22e8b8a1d97 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa4165bb53e29ac9e44cddf24b43f0965fa7b381 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cfe02f0bb6863dd86e86c949d3dfe186e62745e91c3e491b9fe890d70743d5f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e40ff29abf7c6103ff6ad18d45c0bff808bf623 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d18dc8e48b5ba072a480ac3a557d985ea5f91b20e006735acb20aa2e903bc228 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1835431dd09290b4e3d652b60aabcf5c875121a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63fd888c65604887a327fe049f5c0c789d7c9db0fde6e86cbe59e75209b23be5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45b8777d1eef01b2bd5ad92374355293f33e189 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31265e1eefe19d3042ba037591f1c314fffd85151fa2b977efef63de571e530d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77b6d004f3698f60e5ec186e6246dd9019d6e347 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1e4ca062c14cc7a346ce83708ce02866b3b2cb6e7f533edaec6636f5bdec7b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..969a00256f7bb149b74d942c61be843b0c5ad2fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7ecef36808121959ebf58a9e442fca317f536cbc34b54fbc3ee135c92009c5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfeaf3f152322d60e5f0eacd5c9947e234515e20 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb662b9d59c5bce5f43794445d59df93c1967cf9b21123f7e37e1b50ef444b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3d460d18a4017e108cb74bb43ec72e1ce3109c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8257c4a87020147c6c24b78929180b765a9170a604c5890887dad55347116163 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9d1f83fa499fde99f5b4405e0fa5b4c44cf1860 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47363b2f5447fd2979250a50017ed85ddf99e1cf0f56eca57f349987463c2772 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..736f3539f883ab5c15aaf596f19adb10593cc755 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d056648a13c400b937da51a2bd61a9b913bd23232f4a945176642e4b4cb746 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58ed2fd43c75d7d90206c9640aeb51a5f2af089f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:378d4aa6dc5ca39e2c02177d865f21fd8ac574570183dcbdcb57f7d0ac0ee275 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4bdd7b3f5b777fa200ea55ce23faea4ec3480d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f1b835b0cfb6b8e453b5285db26ea5a2a78f4e3bd60434d01ba7093c7741627 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b9a1b72deb8366a6baad098f55ecc23eca683e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e97f7cd1c287552abef16c01b6c882c2cb309796574768861b2fa983bdae10e3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e31abf68bc93d05ad98f0fd68557cda07663519 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c515f53c6ccad3a454a90c4d67d7121200ccccb872fdc5859d8c2e6842c70850 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c31c73d8132b3542428b7688b76589938a8d2547 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5753a00c70e2d4703392f955e8fe6376f418c2dd45ae7243a145e4bf4c9ec592 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b0c6acc6b7abe421d8af36463e17dcefd3cf555 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5801b97fcc69a21177136184fb673db3bd5b14cc152d0b2ef15ee88211ac8a80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33d3526fea37a582b5fe21ba246b79a8c4a47380 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33a9a360897625e415bf2bd01683457a0754657e2e831d21b46ad7f0ef58b6d6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..446f0a1c4a2b6d25fa4ba88d39a4afc99fc50113 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4f2079011cf99514ce08c1725f43c85e29d4308187e6cbeca7d0ff5d61aefe4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3db26b55e8fc6883d6afb0144437e7955116ecc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74beb189b15ac213fd1a4a2f4f7f7bcf2350391e14bf9b18a653fe20683a64f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5a0d3ed4bc6814d08f025275ca1df56b6807480 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8861ee42b283be854b7ea60829ddf82f7873c736af382c7182466fcc2eaef010 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8476507e87af2edadba68897e8812c021288900 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6972106384eef471c7c87e45848d3d79b4d0521269ff7791b1e05c941c572c4c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..559d7b2f029503e7d072114d83c26c82d9488d20 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1529ecf97b4cfaad5b539cb64131b9a123ba28cd8679d08e1c307fdf805137d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eba18a794073f520a575ccfc0bb517aee9410dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b12036c7ab191660ebddf7d9747b112e742159d94b3180c3e7e1b0acef720e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b95099b1145557d96c5538b99b825d814335368 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f032ea05d8960e3090f62c2cdab658cf916b22caf6a60f97a7f856750c93b9ba +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d9272c412a09cc6752f912ba9f78cb37d94cbbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bff0677800cb3b66587a29699402ee32220b87da25360f71f671665197061eab +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ec1e0d92b1f1227d5e826247e68ad4e7378c412 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bec58ce25a2a7b71f09f2016aaa6b3a129c3ac2309d10123db50357c27fe5bb0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42a54745bb00b0dddb652dfd0b3901766e9c17c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9467d97d282ca67a0c89ea79ab26e6149b8ea9641a2fa2d784dd1959f49c729c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5c7f5e10df7947ca8e18685dad352486a46d161 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fce686ae5baa0c3f7be454ddb293c1fd55108f1c2aacce8740b1dd5982025849 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f549fede6b640497d8eb3a2d204c2cb3801ba23 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783a97c6239204e05e1b0bf1d218a61f0b1da34d89f15257486e7dae40428041 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2319da74912e6068aac6a9046d0546fb87d6dc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1937bafa28885e31ad62253af01bcffc06506ea38c48094fc1b898ff9ca6924d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9b8e50390be41b7297426a4c3c924ecb19c4baa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f104c1bd55b02c72ed899feb9cc8aaaa8614b5517834849b989b6f7bdd0445f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..214fe8faf205479a6e5398c997b118f53ed769df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52e4b170bb576c69897d8ee2e47ec2775e603b1150037598bdbc94703fe96eff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af2571f5c8d27fada9df98a555e52288afba9849 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4be3d53a61684872e6d4e3050988dcb3f41f666f1100fb47e7cc812ad7f78ed9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69b96ca564e945be1a17c2ef453ff5394b74eff6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9be05dd45bf34e7028cf9a34ebd3b738dc4d6dd5d74a9a38058abc139732515 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..770c84b6fe5f613a28114612975eb30529d2d585 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:975f7457708722872ce3138751c11d49c5ae76db5fed1cecec5f1dbd8aece1f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04ad57c4761c88124d91692cf8afd02a1ff01550 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0ffa5c670871aff3f2b6f169830794ca02b21343197d80c413688c53849d2c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e23bca88ee416eafb7c00de0e1f031301e9907b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e8b7354f2590fcf72907ecc8a8f56949ebec6c1fe1eec54ce02c115ba2ea7a1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b49800e19ff09ae2bd35b8636143d27949d2bb3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb37e8fa050ebe373c779f44f1971ce654432cbc966ac76d07f9999fac1806fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8de25ceebb20328b3187c119cf8735f142b834b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a35e03add454d91c41e8e7792a21f90a550dcf9c2e68b7bab1297a979bad82c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8484747b4f3f7609f4bd870cce48867f3559ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee3b3107fd36581fee29266b7513293a9e1b04eeff9efd86d2254e61d5827b04 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7cebadc6ea07bfeab440e7ceeb08cc56e6ed6ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c55966e9f6ffe30289a0f51295a4e1b6dc75fc58b02a6de6bae959c681b724d0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ab990e4f9294e4d64f4283d5c67712daada755f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a706ea9cff61737091466dd5cd9f9916e78af3139be74b9adf42ab84da25765d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..686b56e9a1ca27a91e3315d1fd77800cfdad2dfa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c7fd78ab91cf88d8d87cdbfc74356666e95ceb2c89446ddaeab073b649ea16f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..743989e112d49478bb8c09dc3dbe0c022b0bd736 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f73b021b8975064bf1d9966f913d66c7573ea702a68c833323edc7bd396b94c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eecb64094205a662e51fb745f9256f6c431af449 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86418dbdeb1c8dc729c58c86eb9f8353c7d9920acbf9e56002aab1439226200e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d855d4f2f7bd5f9814d5c8c69feef284d6efb04e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:648771e7a2f87e972f0f137af4bb184d7185704f0d1615822232ab755a7233d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b7bf9a8c94adb9ec2de43c885f393d3a529d1b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fcbdde514d8144af895c14b62ae2ed5a3be9615bcde7857e57d65eb5ea90507 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6043fa940b33450411d5f7fb937e724cdc44605 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8e223e6f18827d55f4e04ad7949d29d2d22e84c77d0b88a5ca5e977136b7204 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c6547055f88fe71491374c787a1f9264d0a6f3b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9baddc8809f3b858a4a88f0c85242dcb599c4a4c277e07f35422957be7dfe3b9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc4b26bfa6dc880df6311be1069d2650f5e58271 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854098bd4c47f56dfe01cd4cc65f3b2db4f9bd05d6da8d1d6bd49a928b5d7859 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bba7ffe1f61c79cd8dc43983346221fe886b2a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d14c4301cf21e891bf216da9195ffe6458e40d0d096aec636dbe6965b61300 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e102f1e24672cab73a9e7c8d21e795a6d3bed587 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2919e4c120ecdbf7725d05febb6bf6ee0ebdc79f2ea2106096588c9427ba34d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28dca2e8ad939e025582c4667ce3d08a044ad853 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bd7adfbdf51c493d41cc4d8e5555c31343f310571cca26e7fdb87ed66330b39 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e54db426f501af14c82f8b4a2823e99e3f92f90e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52e5a1b914cdf44dbe96f942a6fd63134d0ccfdb68f375f9f3b4fbc1dc68cf7a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ece0504ef89e0cb9106e2bd07ec7fc991b4f2d09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13eb4cfc497e1ac87ca97c7f3692efed70fd19252b2113c085c89d9c72867157 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e104949a88266b021881d482fb71947b97a0f4d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf1117bdde55e519ae7db27245900e58ac1f72ecba32fb91fa4ca2156fedec2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19ae9b158acbfa2084b40cc9a0485e32793f697c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76e413e5754644c7af65525b83ecf3b62a78aa36a23ba43c71b518fb02a70014 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e5bf6828ac3f8c5f576e712158a0a1dff7d1d6c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c9dda83c1bdf85c066f9f724b72001e78941bd2182de7b106f2f26e1df389d0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..926c1b85de0a704447a12f5a63435766099481a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f2d01b45b627bf560f9db93cc6cf8c49da29df703cfe86691a246f8caa8e996 +size 11395