diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd3c7df958de972e487c11367e9f8face012d3d6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ee3f4a13db44f4511a62d1f34c0bf7be294a42baaaee4343e8bbf572e6a86b +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a27685691676d3285f47294ddd388a801a18a357 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f2bf8158d01bc5dc8e76a64a92d55d2fad186515b2ed2fb63aa90e8dc48cc2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82b280b231bc4c1fea6c15e202edaacc7dd84ad0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c238861d6d07d84b5c5d33291e214ec78d11f98b29c806efa01331665a4331 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af8c48db4d1150dedc589cb3752e4a7850c632fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f531e8968d10b690638546541f23e7d6f2e5414a6f47034a50038f94b3dd1c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83fe0b8687440e4866bac8960c3f40484c1e73af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:212eb39f1ba5917a56f22fd052b357884c704f1c3a2be9074911801596493394 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e0e50bb75551e50598d07261cdd5e78ba86d5af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca594d0b9dcce98235d17ce5f0c386e35bb6751647416d901da2e4ca352a1f9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e464397eddfb0f348aee422dcff909185514fef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1de9232908364cb1f86406c42272e2288d7258ee895aff161ca11480318ee9ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e1d14adf4a7d30f07b1a4c43291c8b6d17165d8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb95431a55747f44994ded0a95a2c2673ff4286a3e831a9c75230e4aa2c776f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..139c19854e14c030b0c6d6e008b9ef8bdf7f73c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083d45699cea206c673314ea851bca1bf2c41913166becf5f9a46aedf69627ac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eff25cc4ab098e9cdb38d23a516672236b62225 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da35c58446be6dd3e07125af10e1855c042049620bb77df989d6e5696c3c942 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6246817f8092b23e7dc14d55fe490718d9cffb82 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67bd452b5edcb7f799d2d81ce04a1379f3c180de4df74270c9f144199c97ab6a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a38399c44cea984b23d2542b2a22e8c5f1130e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be58a3c843f812064c29ac1644eedc0deb07dba3926b4cac0454c4ad6c612191 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47631f97547fded6fbf4aa2c2d4c878f64b17a1c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7064612c6df411d4d68e31b8a0dcda1837daf563142c5635ddd138f623540a3b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..329fd44e631928f5e76f4b6762db0c4b6c89fcfe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd4b98c56cf2afddaa90fcdf1cd33546c5d63897e4e2386b88ca8aae4b83e316 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4ceae695ed5b00c9d1d262dfaed99e3171e37df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03a3b8fb381d4936b9966d5781a22c2f8039a2c9740c7921d4fbd8d981c7cbfc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b44f1bc95a6cb7d38553426abf5caf10b2f4ccd4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4e48eec519a02e8809566ebbc6482e5185e5ea77e192a31612b39981fca9f18 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b0632e088eaa7d14a10fb44b9b4c708dea94100 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00dbb96e224b1fc0340d2277092c33a781f3f1af75eb7cc75bc94b4162025425 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..663033daffd9502aa1cfb7b38b251d343e185bd0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c6dae9d5425c411ee0f8110360086f23e6f6d47b652bb6ef771743bc71a77a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..445303f836f9568c1b8f2d2a6f471176e68b7756 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88f85192c9e8abca3d8dce4a30d5d896388e3a410ac669cfd612e67e4c11be75 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea16f25c1d83bade5f9ecdbce0cada29c010b880 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd21c4dced12bfee5768e46284e089e63fdadf92553f369ee92a4e7ef0aedd94 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcf382fe012dc504df020511267fc89f9d9b4f83 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f28d38bfd1c990589f0fdf514e45c50ba396cfea1c61ed9bc72ad389a6764a1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98b621b4cc2e3b56b53ea41930e6605ff7b283cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a5b172dcd4b82df8cbf6c801b3c0707f5af457e2445c8e742e9c5c9f1fa5234 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23502f0fc2947e186a1641d3c6b4d71a4fdd24df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b35c19e71b115e875d0c96a2a8305948155de4de7d487ec7c5fdc62723cfc9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e79efe47a093c0f7488226c378864eef24974b97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3801c3dc000ecc819f3fdb2989d5adade68adf9cfe4435d3bbdcf8d25945491 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e72144c375d91f1a0204e9b98776ebea7372459 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cb832aaa7b8948897f909fae2212c90ac6fba8b4b898f9e243ae8ab980e18a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88d6f16f4913b9d189deb1a12732680f7fcc23ce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49ca9a4746055f0e7d227328c874ff94b39898734249a26f76412c731922e3aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19b0f10c8567f05a1dcbdc641b5246e167b421db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02c70f5d6e3a21fea59a0fa84ba8bf1afcd97a26cdfe6f78a9b9d05e1ac67eed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b9c0c8488f878144b909b110622fb25beec889e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03ae6c337214d00566c22cac565d912d2dfa138be77a1c55d7d7c8ffca65fe98 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..236850f68c2680b2c23b6ff7cd3c91494ce45838 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a018a84dcabde0d91e70ccc3fe0e6de321919ed16eb39cd8c330061b2934a709 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1049d8bcb89811732fa313d6764dbf0ad68e5327 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:635e36ee83ec5b3813e91e967b5ea53d6399f08296e495922078e2560edc7b0f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f61cfca4b72d3c79b0df61c5694f4f1cb507f03 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa4726cb9dcccee614bfe7139363bf30f4f16112e74e2a2613ec1c61a887242 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a553d50a1af40f9060f384fd57fde4856b39fcd6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab8a37e59f79255ce805bf5f11bcfec314759f30594720575a90b554b6d6be41 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4fa0b523bdcc312f7b3e6a89a58368a1f352614 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:775d43f7adb15369476dc4c38d84236cffa76dd40c966ad0ca9d6cc52ebc2d53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc3226a069a06c9f8e50f60044b067cedc55908c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:523df8291953be4148f3bc58b9f8c067ae8525c5a6883cbd18bf1233cecb3fe7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f939d0ad7b1b68eb5d309bc9ed21d451622c0a41 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb54931bc24dc53991027aced2a8bfc67926ca0dd0860ddc94fa5c5f55d2d3a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f59116201bf31beabb3443543c79dafa9c93a29c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeb6400305a38dcac49b15c54bd975cf941870d62b00c05734449e0ff0928f9c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c31d7f1df131fb433f8550c0d48f35655eeff82 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:181bd944c6003c862a80c2ba65bf8f28b249d70a9db99889f851c0c3d48c6eaf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e0796025c92bf59586df6bc8b311597fa9e3f6c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a44704fc013049bd9bd398c6ae0d17207900453d1bf1f8d2b0396f55ae3442f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d9fa3e98935465b8c2833c691d6a088c9482e0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e95d2d5901441bf8b167a5d74c03e9a57d4931399e4579d28fcb74fe4eefbc6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3dfd2888fc393ba7cc03be6b614189b76da860b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc03e7e4b893c4b4ad75d0cc55764202831996b18f6a2e727f68925162a6fe99 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..907bd9a6b45f6506fd9c9744ab8b674aaff86b97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:741575fbfa3bba96007c38b490877c775d88de67f5c358fd138bfb7a29aec8cc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a803d94ebff4a457c564b37e9ca493e926163c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59aeac5e1f17f7002f441bf7d54a578789ace002f3691c63e4597c8b323a86e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b1991b2195e36426a8d5fb3a8085ac8587d3827 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c1dc503ddd7e7c55479099b0ec59b28631efe3fc91c9b11a2b8b4c18a3ee34 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7f0e93a5b17de53be6f18cd6ea4d432a708607f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3118060ea2d069645e38e9f7b96316923dbe351dd020b61585fbe3906157cb0a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d707fd21e26142627acbe901de582f78dcb212d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1546b9fbdce0ac1d994b4f000e714cdf7cb128c4b9e31e1b9900b058e6d1c4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98a188c8c3c73c498e1260ce92c4e9e822b38429 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc8910f0b0a17bda87c38931cb917e1c6ff4f677ec0657ca359a7c4811f1857 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff0cb4f977e04bfc0dd067f543027a9b98fe7a5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f44e3e30e54ad4f12000116abde0d87cb2723d8d7f575eed084858fb1b7b590b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c31aafcb8ce2333ca2957184ab61d6fd20c5701 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df6f52597281e2919c82a76f0864de61818a3be3b21fcc092525feb9c3081236 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54ccc49565ee0e15c960716e724b861f5446c6cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:914d6691d0065883e56dff16f5ad7fcafce5721e856faeb134194071382626d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f40808497733f4c03d8521ca0c77c188711c4fff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e273f4ab0a550640e21835f4d0f5c62c27c2797c786455f9227b8baa3dd92b1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99a052754d7191ae2bdbd1208bf473b2d1eb3cda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5261034e0cfd21b0ee1acb64ef96ace4105554a5746481be78374420ad03f6d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aad0f353459c87827d063b7e6f96185a22e6155 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd0ccbd44c4e40e4c70733e4d65388e429f3823dd904aeb0c6b3bdffa405db2e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dcb9c40a51c8ea80067f33cc2d5d34118e3fc8c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac4412dfd71bbdc2fd93aa4c96acea3737a49519019fe494bc70850f61aa0a4c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f03adf9373468c2454c2b11f6bd4af774180b4ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eafd57108f444efbdb7186b9f86991a68dc2369625853f55a02b918ec89f48f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33330e36ea4548ba8455d175d06fea6a9b3ca298 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c86ba886103bc9168348279d928e7386b3b8ee980aac00af4fbfd38914e749b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b450a3341ef2cd36869404c33f040a622c95d92e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dd73ac7d3b85e4b27b2e2edfdafdcb86eec323ec3d1dc430976f18585e74f53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9d04512062aa0c5591d99c260a0587c319e56a2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52360f26148a531219f14c9b1b5543683ab0102eab4837122c6717a3145b459e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce17faabd2cef29b9865f32f343f3f216f2a52fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a30b56f96f3e21a384c4c391a5668a0af19ef243879f2884e5a61cfd076ed2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..287a1b483ac24e5d8fecc3bdfc4c09774c01e9cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d30371342dcc992d9537b82b371d8eb987c07dcca98c15a94d4aee6093e73ab7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b10a06d25f760092946a192d9dad073275c23a45 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9598f78a2e63b82958ac70e6f233b06defd3fbfd58b05fc4ac0487c404eea7d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dc699653f677a8b487cd4355cb16532a3039048 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbfafd0c618bafba7bd4fc6e75a81f4e56a90710c01c3cb5492bd82b65595550 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b23117116b2445c983be8195016264eefcc435f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36288401996956c22509760187542f44f4c1417fe0ac5d5ddefb30fe7f7f8616 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..205f44455d2bd8e7932e9687819ce944afd6b309 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a3e549580e9c79dbde4057a503c5eb24f6034e197f9392ab373c215e2346e00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6104631dbcb10e4a97b9608da4e7940804a4b42 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffff54218834b0e269c4417df65a4d6733af44d1c9bc631f6a5f9c1d06ab3cb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c40f7145d97ae9ce8b3a8aabc34eb4ae76d10a17 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e732a14d4b2b7e7f4b211c54c0a19ddd01a186f4aba395aa904bf96a99749bad +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..807d04da6f124b05c85cb5d57761e42d13d2918c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c53edc23d5f5230b97221846ee9a1a037876dbe9b6797c2831674857645dd9f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd42879267564b842600e24d7658d8d40e6015fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cffc1098c120dc1ab6983a8b2ff692a768839638762eaab68e0b053388be1d63 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d3b1a9edd486e016385c64c3650e142c23857a0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaf87b93d6429435d203f01ff50ba0c8680b2023714a49001c4559bbbd77c313 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..943b0fcfb442270ca18516e48165622611d072dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e7eb561384cbd9c06a87fcb7e8cd1c4697e7f3949bca44a35f41913c8f3b0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef950e76cb740f83a2c9dc77c06c4f65f232b105 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1146ebb2c3df8bed45e7db28641cf8fb15d1c253ec767761fbc0afabdc16471a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02912ff57caf8368ce1d829d1de6068dade4e695 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac485369460c430b2fbe7dcfb36f89917f0b3f73e398ad647fa73478422a8dcc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8128146f9b15d44c482ba64ed1d395221ee132e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa937075d3da133203dcc3e8a2883e7cb4ed5f48efce856972106b8d2bb813e8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db4b022a052f4aee6967a62884dbdc389fe6cef7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ce4649cbd9087787e7a1f90bcd4301892ebc9d821405c18e393d0b94525bd2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b844cc157e612b0dc46f67356f5001da721990fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30c6f06ef7e107c2840502bba1a97213c7a317a334b24e8b69919b6eeb4032c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e9b898bba07294b01f952dfac21cb197519d12e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e07d28bd063f63e65ed367a3b1ab4abba71fef116a26a6c2b7db5bf742c0918 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4c6fe68cb685686f86ac16f4e0ef2b14dad5f22 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43fcbf2f536fd94f999567597fe0a57147eb90808cd71deae30cfc4460755209 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2de0dc628ebc8a5174c5685a1bcdf19f9035457 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e52ee30463374dfc9b739f4f4ba94b766941ed2fbb595f2f0cf63296167f7a16 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41879d0823658e6ed813460566ff4ec9131e658f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24146f42c61c011a89d65b97de330abb67f038fb8ff0aeddab4caa0f1ba997ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..673681d18d3f548fa636220685c1a687e5e0f08d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29fbc4c587bb0abd495dbdb951decd735e48c066b5c8e194f29d92e55fd23818 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..34bb7d478f211580c27c568ff1c0c19344a47740 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebb6e76eed94e2b07e9744c1bbac0a421301fed68270922755b78d5e35a14074 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a46e119edc7b10d03cd48612e43ca7ac98e01f61 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:688274af6dd85e44383669909bbe08dbed707703326e0064677005399505ba0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..092bd0d6caddc61707785c2213989f6e55ca0000 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8f96636d4349b89f3013881a19be93ce3f6c7baf99ffa8c3ef1fcd1060ea69a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe360b530630f2b37dcc25ff9b7b102d8f722a23 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a60aa9472a1c94833084203af287318d30d8877e3f13d6ab61837fa1e3464f77 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8703b6a63f804d6fcb0429baa3c26d64d3bc31e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a7708895645856fd6f650f15a9f4d73661caf76db6640ec180b88bbd1342d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d65ecf1d282204bc7dce87f91c538326b026fa5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7476eeff01f0807354bf3212e027cfe57a7d8c0d6714f22da15ab9823b21efe6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba2ea39dbbcf98cd5eb8edbebae3a969038f573 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf61a045a9523089a0715b96d715a39c1b5bbb38c52930084f83f0b61d6bfd1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7361e47d70b86bf327762f74b2f34d718fa5b05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a57b4dc3079a9e4de7e7fc30ca38ed1124c9b3b0e571c4b480ed3620d12b761 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec140e768e770af6a164ac6d16df1fe03b23644e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b1d61bdf677385e46478dc631aa973316e5c65b15997f20d12393d8e6a856de +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9796f5da4e4c15c65cf88e21f2494589464ffc69 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcda9dd431cf6a14e6d882e42d16d273b5ca3c09d856cfead29123a6aa1cb79d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72b4adfcf3f7e45676a92e620fe8729c15cd9530 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc81a46c4873642b7c7d70750f653c7c08fa8270e4a10139a48bb3d07cb129e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2dcaee4608120b7b605306d843bb82b68251fb2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2662ea2ff33934f5d3e1d69d3cf1b4adf6ebff0f471815e6b326a912c9332292 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..182e5faa14480088b62851d137d6048216a59b0f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a19ab06c680f017c28a709ef7573cc1c1a33fd395398264be907283f2b767eb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..786f6652e226994a080d5fb3ccbb7c1f25c7ba34 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c2c5680f89701f1a6f826e216f8b027568f65446cc08b03caf3984facefa06 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edb7836c719cfaed5daaf1b2de8dad113397b446 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc4d6f90850f0162c93c4b9abcc7fd3afe6e37de710fb648514ebe50fb8a552 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33571f40a8e4ddb5c793aa9070df4042326bea9b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5f79a6bf0608ef2ffbbfef89002c29a4cf158d36abfe929426951a4226a1c04 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15dd1acb13016f45802c6640084a244b28a23ae5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5db87ea62297a91de7784128fbcc18555a9d4697cd31f950911d662495fec84 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e64616255e1fd773fbae5e03db22ca9eb644f6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95571fc709d38edf89f3bfcc5844d52b9b9f987f0c262c8f6b872efcb5db8796 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c833dc9f3775d9f90d6d51eef3f558faf2be78f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27020a61351fcf886966509a08b3fc1c53ddc53933b2fb148f84be900d2121b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e450d88de64fed2fceac17c75eeaa94a27c02f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:144f28e06b43d22c184796b5c9615901fead33da1c40f24559479ac5bd56ba6f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f2f3fe9e158512fff2b8c10363e3114787127ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c30f21cdf10f537aede0bc275eb72a9e828aa4e9042aca06be9cd8d3914086b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b702e2ce277aa727f682e02fe69dc5be8bfb4d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb08f079452af06b6de2c98d482908991f18feefecb566de38e5986e873fd73e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cefd323606683968ff5c7debbd5dea2994918aa4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8184bcc8d0d67758df09fa312235dca0f0dad0dd5bb525f2c1476f8ba46041d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d9e844944176e0b455f62ee036321bce708203c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fd31422c4038ac54d2b564984587d8f1305b1052454f6dac03823015135b4ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98698e884f3d03c170925564eb816cd2542dad3a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:772b7d03e7d6065d60c5b9c1b022a101f21ebf51235e783ed229fdc42dc4f664 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31c9c46f92ca877cf1011f9452922c9cf47b0ea3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9df6b73c67a3778d2f613d9c837e63b2ef1712be787efef69783f381e4921b35 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be5ff8e8e594d03d664c38c28fe6836976ac8cd2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b78950fd5da73218070bc8910b56efafa90a80fd3ff72d627ffd63b0776bb3f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d851e2aa9e0832b29347a5298682f924ec99806 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fc9bdedbab535f5ed62f2960035242d6020e063063437f6b4432ab79fc2674 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba9fa704edd3ab1fd7d1f3e9b167c8ad74fc3932 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41667da2ff99bb060d13c0dcb8a12820d6cfa00597e64734372e85999f8ca593 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d90df2e1ad83106d31e44eb4b59b2336fbcdf4f6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:302e14de19a0ba426203f0ee33503dfd1579a6977656702c050aaa51bfeee0af +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55db7dc6492217f8c04c65210b14aec2bded279e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b03fd3a2162a52808da092c127db8680b0ad77f568e7ef1e5940415920fcfc26 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9749a9d25cb291474d646c04b91240a6a26f6183 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e002dbda651de303b68dadf6c7b1742253fa43d89d710b1834501ebfa8ef7bb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5f8fa5c587cc09b6329f9c2b72af34f2065a3ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526506a017ce72ab7310c59d676f14398b21aa40b1763ac96e6f9629c8673ef0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e8c87264ed01d7ac52a65a5ea54242819a397e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050e4b73af441df7da92015dd85c5a6e0e2789155b8984a7f639965ee347f418 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b56fb3cc890e6a0c1d62de80c83e9eec4e98ec2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e114b379044d8219324cde8326b3d3d3ed4f12f9b117a705ac6cc08a12dee05b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc06f03f0fdba24b3c3a286af1ae588866ba290b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a5eb9ff949b738b12a7043917c4adc85d53227cb63b535aefb949309ac3b025 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..168d4ece936c3db76c50ef4e10a8f161c27b5ed0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e3b4d529f6914aaa0e3e05c5994b11ca1eb70437cd8e9c89c9966286193f91 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..574252a996c7adf02f202e84ea36c49e465297d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0d38965f6a841a62f74920a771876dc36946a13fb4d20f4b12671688458cca1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b3b9e9d7dc228fcacfd4267ba061bd27509e218 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b641dfb16e056b0c51b6edc92d8956e6da213036b7d9a0a22743e05283ec16e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e9398b0f25c68020008223ace002e3291fbcf0f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4b0c9d8a640300cdfd8d7b70b1ea33e3637f2463d830774f8d663ceee0a1ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfbddb2cdf418d48999d250e847da51d959baad5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:889a73471a9020a0cb736bce66a91aee0af5fd102121062225778efc2dab4aae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..471d4994adbfe570dcb0d610dc6a189b95ed6c0c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d872d5f4940ec6c614021f61f86872f669a5525f396c08c40ca61f93c1c20a49 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f24d5907420b01e8dcc868e5335592e8a15b803 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:450b1b8f6d0945d69e648c1ff17aba132dabad412aba784d19b156127309b533 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b528e2f7b8e5bebb234a6421f107964ff6651fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b13323a4dc26b4ebaff8b54b5645fe8258f738a6ae3b3472f89ec78e2db2879e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12cc72f7d69356e6a0d64092bbc6397cb9778985 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9e832cf9430a62022f9831e35314c1dc5fa8b86dbcbba30ee6799c6acda66e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c367af573825c0eb0ec45c109b64ea5939589383 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f00aa7bb06cb7d55a531ea83fd5ceaccc7d1a3a25c9ffe0a74da8a654b31c06 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..81b00da0e6b6a96f92e92883d864279c3ae0e3c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb797f3bf869a67014f76a5c261df448e8e27fb08841b67b30489e8dbda7fbd4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59ce5195df340429958c602bc2a68b100d912505 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1c4d45844a28f0bc14d14f2377bbcce9fedb5ee98b7ae456f15743bb2576635 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e7725ebf15c1786e309af5186465f2e9eac4bda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff2be670894c191ea9a0e4de12c8728ef2d5ea15cad788e131643edc8523b65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e12191e5b395d220f10cf7926be971666f2f02d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad1f3560edf8711c6e656ee3c0b28c7c1a5ca704e9ed04a497120ab2c6f3aa07 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..282af25776b98294da9af0014ac1375c072c3167 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d24b8d5fcf0df242d88785400d7b258b39ee16a2c268051b212da0538dee9e02 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef04a23225ce8dc79634ac859ec79db5ed4e08df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f42a819ecf53729ea4d656ad337d0621cbf58e77c20a5c196fd7b54deb0a6e3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c688b0dfc2ce0e5f8f8a78c95c1c73a2ef06e7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:597388111e1e9a3cd3d80a991e57120e36788af06299652a7a68beb4707097b9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1ffed8bd0a6541c15478ba47a019042ab73ea00 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c952bdd189a48f8e692418bf0e8c0030da32afe393f05d7742b945cea54c2a67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80628c2e6f7ffad55d78ba7932b951f0a76f2a04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:732ded6cec03017029456340d20692524e72550005f1b442db08cc9f0c718aa7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00424f4ff7dae03912273db170c9b5a08c71757f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:942cc66eb07dd35a088a715b1692a1e2ca54f7885f5a447a864fc31c39b3ab3c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d7239567b8f6584b3c80d52bd46ea54c94272f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b7229b7c3eeb3a17c77b634a2ebf441a767c379f22a985bc6edb2f860ee591 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bae22b0990d4d6b4144346a157171369245e70d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96fc0461ab87026032a29864c247e77d7ea4f64c10098f6f13af6a4f8d241d23 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5ac51403ef546387eb4b7c656abab2600ab8015 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c2e3b39167a19a4b97fce34c83fdb5c2212a008a0ddaefaec83108f89175520 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbeda4376f476ee221e7482b87e13c26c87660a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f52279b4a3492617ce1acc3e4e2150554e521d1a350b060eb552981165e371d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c86c7939fe9c19398a8543cf0433bac51bd421f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:240c416c5a7451fdecd52bdb30b180ca2140749263a6ba40798bc1047d1ac2c5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da910d9f1b02cdaad3b7c5951c40ef38ffa6f962 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7502996d40bdbdad2cc723be6436584077575e8dfe85db94d6849f4b878a3046 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4351524b7c912558b79db2232c046bb83f56f7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43015d0c27bc79ed19f0a6e82acf6fa73f9dcc33b9595a66ee65685eb8ca5821 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68e4445941a850c20da1bf55696710520f8fa86e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14e2274e15af62893e4781204aaedbfc670666e749c7ac38b9fb7eb4d4bb7e3d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77f2a4cc8560cf5898534945ea34644e48777eb4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d97d62b18407f7d4d84841218c65c310db0c61bfd9d6cf49a2b3a18c2ff47d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..596a27c78872b7ff76d0c2e647dc54b2f9f02d74 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8340d3254bfe0fe906d7b1127b50f0bde18f0052dcbf5e5b6ce0b104412993bd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6f82c5cac2bf028786745910c53603e360c2b5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:094ffa931461de00a57dae498b6184777ec104d0fcc7bad513c2674b92f77000 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aad8c986fb58d632587e4953daecf0f3eaf409d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a9e169e14f3e49f849a552e779b34c743dc530aa726a724ebd225408b8e17f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e878de5f3e807c39f6aba6951063ee023ae02a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87d68dbd9f4a4f4489a35d1ca7897ace09b5e8936f9e04e89e232d983a8da02e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6cbc2d5bef12f3487bf26e1e7220d0fa75dc6ce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:249b3b5cb7c98cdbe6be699576b31058439fdf9b5363cb96924ade90e8b87c6a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae6537109714b78e7f204adcd7dc51894b5f8baf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8caf9508c90b08be41b211b9aa0bff37dff2c7bce9a33719f091df6c404cadfa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edaa6ad23ce1544ad62785f4f0ee4a8af39be5f4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa75fe7fddc45bbde7a4dbc5c6f2debf8933f35ad97e6b2d2256262155c0cfc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0bc6d5aa94cc4e678a44329986b3dfcab7fcc8e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10323b4da9fc8ab6638a2238f2a9a939f3ed07c55a5d62156e4976a9afc17bc4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4245c1aca07582f1e58d52b34f4756015e952e16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:426e1b162f642a1d508273176d66f2180c53a46d3bbe1fbe8ffb36a3bec9f736 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c4573854fe72360e75378a6a8fe8164e01dae30 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:095754824ac4fd26be715516d77e68283a14755d0de264a28da6c99e2cee16c1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9bb43ddeae12ec512f1dbbe2333419be5e77515 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:473a88a6d504b118f3972c327d4d149190a3e0bf0c9a8209d3aa13b67611dd82 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38f76f9b3bc85b134b725a84c5779138ffd4b54b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64bc8e20301bd50e1e66e49d4c1946a537a0857d2406bd9cd85ed599385a4d7b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d05a49f2ba559110b7d01d034b11d02a126d13c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d3b37ebb375119a4b5ad8e00a88a7db5df0f7c7c66688be2a3a471cafc7cde +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fabb0556c9c2122bdfeb1c4f0f485f927c7d167c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49242d936480acbf241f4a915e19bdeb02307cb4d7183a786af1ec3b72fe22f2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4552ba1de0b100351c63167944a1515806f16848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea45a24769055f4e4792c79133cb5efe8c8c499368fc93d03e6a430a5832cc8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b12fcb5586f5e7b3c5161e50b57a47cfb8fc96c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582160b153f18e339d14cf4b6d04fed30b09add1cf077f0cf88c97b91652981f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cfeb51ca62fa13a2c1342e5b70e4fbbe08837a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11080fae5fb01f87a44d244c22652dd0b7d0fa98a8078ce47de02e38e384618f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b4adaf836fd1062c089c6f517e32365cc23692d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:702d36464d77120eb723c616f030c437f0a506ad2a5f761f773dd75192b0586c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc175f483d2f9a913556e4f49d1fa4e607b2a861 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2990b8669beaf0278fe93cac9ead5902e41d607c8c52c4b99507c42734d01e3a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b6f929c6bbcba2c4ccec427510731e93d28fcd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:985d591c05e04ecb354c12b30747a61f8866eeda9e576f783031600fcbb7f483 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17c836ca55c7407aabace04a1bf6b3bfb40955ab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8e4af8da3ad7d850e30c5651bcdb4e7d39905fbdc4f6c665338359f574d9433 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0d26e141aafad228ccec80991fec6b45a274ef1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d725bd32958e6e6952d3de4f9d6de30c73fdd9e0947ec2b70b8114be4a6b4eb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbace19ddc78c4decb27510aa062f62669b3bc46 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6cf04597a39e439d7e81ef907327ede7f82780b252d853f19db0eb05fbbe3b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca6a22c32bf11b69d87c1c713ff1776c360c1507 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03c0847a59c669a4240e4c9f81e6aca85a7e1964e76d1ed5cfb146804f023da2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cc475981b3358e101ab815d29250ee721aa8ac9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec027ff95ed090ac78e4862b9f2b8ab465d65521c84443527df40406134b52ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9f7cad84e610b90e7b63663229fd5da591257fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f0b34891c29c600434f61fd58ccfa37b11a4ddc922b239d049e765e259fb13 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed752325a99ebb99f46f590f11af6b2478dfab5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc68273cd3f20827de2ea7294aba712bef7fe5d15b0fee0bd47b9bef605a8c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ca568466ffbc7f33739d7583ef363ce29bf96ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:006a90db6d6d2e0168174e44e5357be949d587e9cd8a037b3df4fab3cc342864 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b02f1b82a3d17808bc6b7162eac22b859eb313f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d065cb7aa021f27532eae3bf67b20e55e631f1fd3c41367513451b78a91efc03 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcf3ac8b2a7e73e97c066f8f06d3d7db3a55837e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05338d99837a9dbedf428aee2205ec753fca4482e71a9348fe696863e5a4167 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..111c592fe267d9f4c664fc7d0dc4a60b7acb53ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:857addccd2c79d5fb5b256f0c1c03b69965e93638dcf8e780e6dddafda3e6482 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbf9ba689e7b4a447bdba9c9205f77d3a7fffe87 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:641ef2959f76b37d0e59d0778565db76f864f2c53114fdbcc50b522ecb5bf0d6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..020f90afd963b63666db1b8122bcf620fdae31ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c7a74d8e9b013065ad4f9caa372a404bd73f993cc9b7e1daf02503f56dedc0d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66d03b4f88b1253d903e239c8a08de17047774b0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3e329b94a27e89c0ec2b099b08b09680c499c3081f06a2164369938aaf4769 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f28f10a62297f7a0e3c8ea83d93315ab60c31c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c3d36f62874be01fdb0a8b1c2aa000bb706b0d1e900f868fb666491e97e7500 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4646991a221bd353493554ad89a4154dd957201 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b508d6ed33db9454088abc11aaac47e95837b49769fe6e5ef8cd46f497ab215d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5721192e8aa4d36abab31713a6b58350c0c7fe25 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7cd667398dbe303812250aff870a8eeb1f17087e63c15e2788f3cf3a954451f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a13f99b1e989252317c6306b1186c4f461aeb90c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12164520074dfc14956eefbeff68bc5212110b36209618ab7031aff09ef4cad1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d9fc7b322ac5f454f151a6f35479b648a2d6720 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae61c3a018417e9173c14253d7ee600d7dc5c98fe9fd82609bd8463782b3833 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e85947d45c7a0e51c8c657880cc008e4151059c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f82b61442b8d3ecf729cb02c5f54107b11732c5a50045829ad03d2abbe23a6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b338ee1fa6e74b4fc4ce74a3926f94e617b47312 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a5b5a5096ec1988deece7141575e91d439524cc81fcb20c9cdfb9ad1e95f80f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f42b872dadb283a57bf750c3d087849ae9fd751 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f612fe78b30fe65de048d91e8d41060544119049f4b94efa41a4a3a5206abbb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c62961e38c3403b354fd17aafc77c0c242786939 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ce254b3ebadf60f28213136c55c33d7364bd0a087ec3c6e0cabbf823c93f2e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98a1e375ef24bae7e5d980c23b7e086dfd98f954 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927783bdc4ae6d391cfa3f957812140580f5bb43526da342f8bd7034ef35d681 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c64bb1b8d38e3c6977983a7d6dbe2fb34a671bc0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73654300347922cdb6ccf85de4fbde145224f6a186df5c749daef775a687233a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07d60748a9d30a6cc4d0931c4203563851445e43 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa7da1e1e2f8999abe890279e3eb3c32b7ec4dbece72aec43ba9fdd7ebedfc3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfc598a0ef719779b848c8978f3600c9c8aa4295 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590c2edb2a4ee9a16a2656a28c3ed2ac3220d03543433e7cd82f08c723fe13e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61b42d51a0d6beafd72b4c9c750a153b7e938ea8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cac87096e65add990495b5384b6c0731952cb9610782d7ef2e1392a6ad722dda +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82bf2c6b849e018d743c10f918149a1544bb51b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a31ca3ae6d64781cc3ea01862c11c992b6cee3ffba196b0b92d1c09502c8be2a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..47f48881fbd58edbdf779b6b0ad891e7280e996e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9b55e68c469b3d22d9537ed657f02aee6e9d25770965af4e92ea167db76f361 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f944c766640bb2afa6fc33942578db2600fa979 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7108a64d6f4873b0706cf3e83d19d89f5a636d1bd89685cfa59b51a11dbc2e44 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03e03c38cfa3d25318aea79eac4c4a6313f92953 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ced86d5e03d3ddfab7342b09430782d18c9ee257e05a5e6530b1753a8348f04 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..128bbe2fb38bb4e993b6e2688807a87ca019a7e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4ea234dee8c7eeef6f9b5025e893eb0d7ac3c69e862ca3ac422ab21302d4255 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77371254131ac612ea62725487569e86532bee26 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a424e39918a9b318213b5430ad239ccdfd3745c4061a1e439ddfc4fe90180815 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bee7ee092ee90f0ab335f4df3049671b63d49831 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb5582806d5fdcc1b5983c5832e9244091a9091b496309e6e7304af3e6d2104 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1af3af3a3375ef2a122c75d32fbeb2340d2529e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24c795ed5430f8d618652ddc8fcec11c4acf19350dbde980dde2b7cb54a2cf67 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37ca5e3972a711f72cb9927ff40ea802862f1e7c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:194a93ccc64dfda634463158dd7c2249cd143b01f1d19c3d946b75ebc6f209df +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9d9b695aa7fe1ef5ebdb682f276a1935b63bf17 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29bd769c3c3a67eaf9060cc90b89a76a93e4935528c03a9b642fac85eade90f2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..160d5f3626d27db623916f71cb63443b5bd6c4f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5cd871b16c543d61ee9208b7d74840e148fd85280038313a82de8c0cf89753 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dd2f0c7fbb4d6fc31fa2d959f60e9e33ce0b416 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c4d7fc0511dc31fd5c62c9bfdb0dd5a0a399e25c42602f8cf7c511b8f40a43 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68a31dac259f8744fec0b3841b4802b8578349d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec13ca16de2c2c941b2935ba33aef46969028e078b9134493ad6113af7c5bdf7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ad69c2d84f0e4a7439eff7350f8392bc7d19c01 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762f459e87ce0706885e00bb8caa390fce245d80ea77f4b42863b4b09d4e03aa +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e68a9e480f8a187d6930e8c7b608fad2e2a8113 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0335157bb7a977ae805f59f9b1029cd4d87696480dfd4eef8c3e5d7302c96ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86b87c89957f13fc8bef999a034c35fe421b0ed4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6609ba02ededf5eaae71eea1b63fda0be154b927a1b32f737f5bdb096cbaef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61671bbb77639403c22aee27291686441943bafd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da933eba9d295393f8b48f4a17ed858c8346ebe4052e6db1e150f0e5f0d28db5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..285f9cf8d1f90a635f7892930eb938a9fad995c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b376c8d9d586089404bc1056ef6c916b213a5489b552b02388ef41cf3ceddbf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b56e76d2600657fd9d3da1abcb71159dba4b7bf6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93543d346c2a19f8931fdd279ad38b6b1cebd68ee31e4a0fbb17b84013987862 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6b907dfc32066d7c8f6a6dccf81c849c0a6acaa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5095d483d8b81cf4bec02620b2908723adcf781a599967c069f311a170a6bb2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9c836315c8339ce1666126e80ee0e64bd433b34 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:250df55fc699455352ba7df82d9c1e4c52bf17c02ac7bd722decdc48f6c2da05 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..26dfc1542f1ec098479cd9a17cb4e41fdee12d67 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f57d74b8bc92382c0d05859571efec3f8f879b8e6702a0697a7f07ec14299d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dda705d7d43a569fb31093b8f5647ef306591d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f72b90a349f6d73e3797586db7cc20ae080b805aee25fa88bb8ee408ec5984d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1514ec8f616fb7dc0ade2003f75532a078282144 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c84bb2082b1c077da748abe2722f8cb92975d4fb8fcb14f1a0e5f4115c7077b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7c833cbaa2aeec5a02887c7073d8048369aeee0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7277541fd664c9208f99c0afc2de2a4c9ffa51c1abf677e2040a68bb7f492f25 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d6ed43ce7b9bca20f728a3f1e412acc053af29d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3932591d422d73ff979fd7127bca0e53b8e49ef5250acf8a9965611450191f59 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa767851fb3546a133cf9e89ab85eec87f75680d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75451b2cd4900c4b002efd0b67f7aec075dd8c049702923823d5dfd80c276f86 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40b6f56d563d7a3faeb4fa9cba309e7cc75010e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:300da57a020dc61cbb7e15f8958d41ae9a06fbb3c2acff4e294e32a1b773f6e1 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a27d29a567e94f6db921bd276057ea29961ec02 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f91a79a05ed4c7ae877fb44461d89b675a4f8a2c3b1ee89b6c1d0e63a4cfdf18 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..01a9d972c5e9dc4e3d530c0559d93265171b6bd2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:668e2a18922693a59be7b455f7be0b1ba41fbafb8d86cc0d32b6b9e19ffdef6d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d737e0f889e1d0276cacab823aa85672658ed9b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d67276b3d89b867f813a807a0fc4dd0ccf5cbdb8007556afec069bae62b0bda +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f26472b5332af5241b4f216c8fc283abb2847a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b62e6184a7bc85cb4bd034237007a1ee4694872e53ac876a2e49f95626fe5963 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0375cb6d69ca7b57995358054817dd4b97bf152 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e0cc027f9323f852a51a3c37051fa8cabb9ccae471116839c73ae840bef6fe1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca9eeaa533b12b8aa038dbecdfa9a0fce5b792c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac53e9c930256e6b506eb6eabcd001f68399a5bf39b488399e6222afb8b7015a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca5eb8e63c1da6eafe8f4a8e7ee6bf88338b6162 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e592e6c8429cb880c6c2488c5876f53270a753d1833ae6ad1498ac21307fc3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc4b00962c7f4bd28b36bdeb802a23caf794a3fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:370a33c6242087fddb018cb9ba9af19b3258cd23396b1052b75e7fbc744967b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d5873e0fffc94c9d08d5c409cabb890ddf7797a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:571786e0766d61adab0a56ccaea5828ccc8692e243d29d4e07e47e6736310732 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..127a77fdef8778fde1a4fc331c56fdac3d545255 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5227e72d285c92a9b7a84e662665c5a19daf64330361c23724514c59c7201b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff7b4fd56309ec83f4fa21a5c458a79b9bc8ef2b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:748a89ca09848332905545d6d69cb615b8c56da5f1b175bc30e4c15d4aef8f4c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96dcbd89e411cb9366d27d6e19c74d211aead512 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e30ef2a6d85c593c07fca59595c304d18f9a362c0f9da0463a7a35d7da3a15e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..979bb7e7eebb68474cdd2778011c513ec9c65efa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545687ef7e6a2413f294d256f10a76677a42cb2dfbdd7657e962f61536a4e0bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca15617907870171b16feda68ac5591a75a188bc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f03a93462c8de528c8e2a4710ef84546d41c78ae2c9f36d2ee6803d0af8089cc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4b0accce23f1086a143c47beabe2a8275c3a0fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16a6fd924a892b3d52c2640f6dbe9ca1e0a07cf1c959ca0b176d9b139312d241 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46a023ac7fcc792de657908f18c101b64a9bb29d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09f8a5eb1f92d74a0a7212423ab073366fe1ab6ce908b81c13d288359f910b74 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f1449c8c77a91134211f3ec7d91ddeee2abd008 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da813d838637c161f1dba5377a3dc3ecd30bed19173bafcbdd81dc4d5b123e7b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a9fb447770badf6bb697438e7a937a29038334 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2efc0405d1f0420eada80b0451947eb3330711f25315be9ffe77b664ddeae48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f0172b6fca28b496ff429bdc1f92a8c3b12d292 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:076442a70f13489bd9facc28227cbee9bd56b66a9b78462e07cb9ee448782672 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..81434f20314a00e0483258ff50e9db071f379bbf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3417a51b8afc1970b0699350c823a1e8f036a452983dababd17af906376521e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59d061bbcd3c744556f41eefaf266e606c869095 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b793e7bec1e3bb47bdf6748481b732e7e12cd97b0f8722c454047320f21009 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13f81391dd50efeb66d7ca75dc52850319e91e18 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1378c5d37a3f2379551eb861e55088ae1b03a8362b4f422f9d7f0b257e3bd76e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9694d9a62d21d3c1a2239745aeba75eedf6a496 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d069aaabee08b7df83384f9619a219df829b6ad4bf49354cad77bf4c3148f10 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2f551aae34a26a6ef0cf0b2adff64f4af4a3bbb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e40657c6fd6131e5b5f406ba76e05144fb826ab71e2b8e0cb2977e30e6d347f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c000c9f184a7b0d46aed233de338928ccf5f629 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:487bcdb8d10b97d8f53e240337a4b60d1bf737143c7d5a43c5fed51c709d5d35 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee77e65fbdd0c2173fef0ac16b75f106130a0ef4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d42a6ca4481642a9c9405a81e5c29b6a791b9b9bdc8962e2adc0fa5cd02836e6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90a24828b428a34ab1f4c0aa09288ea50ec5a76b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f280f86e1c171a667db5164226f6e576e67e8dccc27c82f30f3e40dbd05365a1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4f5384f10f60806af717366172751e643eea3c9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85f29a6f86b9b43f5a174cf1b938c1ebe45523612759da2a20080ca5c31623bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b6004ff4a6d14127e3046b085b72fff35f33e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32958597903eafc20e6eefa20c894c5981446f4a895bb8b2c0074d0df4be966e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dc6d6e19c19a1ede1b2255b344338d83221b046 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a4d4d0d2309f7bdf31c6c5c96a30ab321902c1d24cdb87685d76bda2f94cbb1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f61a02a4d219d52a02d3a3d44aa78577bba0af6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0de080cd333af026c01c15b226ba09b0a05053268b35bb1891f35aa968ff092c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..43ee3cbcbd4d4be937a80312caa4bd522f0d7258 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ca8f2e6d07b3cf8677691cf5b7710459ad2cf501faf9b113a4be95e1cf2aa7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e08292e44f1d35a81c09887d853a6f88c91a787d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ff83075f0a32dc73307d0ddda17013bc360ab4df4548a0c4aadd44583f58d20 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..da116db91cd58f194136bfaa7147b7001c7f88bf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:803c6d825b111bb91bb0159366b443beb5be13da576b3bbdff2c19ba6761e858 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65261e63ea28786ccaa558fe6a942962cfe0019e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dc67af62d1b4774da509735b6afbbf9d7688b9e76ec873c8104eb89c0bbfa76 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57716b5e5918e4ba1c48339e991da124938e80b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05fdac230f485958b859f6f8a55e73547d270362b493549990a6fa4fe738c864 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4dc38f5ff3852faf7aa7422a110e6516f438546 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad8f13a8209acadde6d2ed54fd0f409aa72cdfb7bf9e94718124f379c88f036 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74ed3dd910664c1aeef15e76e5641d034c18ee10 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10e8f959fcdfe45a2dbff53efddbe58292cfc375fc56e13f9d6cd4473e57b1c2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9adb8f107e5d3a5f229c74c05f5da3e2acdf6a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:594da82193ac7a4afcfa257da567835ed57f2dac94c7185e232fbf0856cb9eff +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef914c3b46bc82dc1f13dff24e304d8e936dbef8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1e27f9ea09804905a2bc07c612c7158aadd05ef728b0f7c2e797115776b47b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1251f57100327a1301381c100b82fad6d66c48ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8568902282d49f8e8c989474424a72790072cdfacce6dc7f77fd29b0ff56ccda +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..95b2e0dd07dca86f127b95080aaec8fb65e28d1c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d781c1f6e29b1a51bbefe6e1631dacefbc3ce1cf945ba39236d0a33669270ef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdcf0a95df1e7297a8e47c96d2d67b557486e7df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e015f22777aeb7c8c51370a202ce4268e05f8c5d63fc52ac335df3029d02ba2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92b4344d825632d8d0f0d6b34b28bf86e4c73620 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f40f345cdc64af51bf198f5e31861326f191aa98c9d7ea775cdc2e4ed7e6b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ea2b35d2b4078e9422bda846161711aa8f46eac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb25838477bd186e2f74a87566b5eada256a957f75c4c179da0c1293dea0d47f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c41784d6b807fc87c7a36d33b043438ffc14efc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd47132e5cd88ce14f8df302603fe4d3f02691feb91556d7c74adee4cc84d97 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15deafc152c174a95202c4ebedf70793381d5ea3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d0c6688b0f56f41bbd62b2220d0a69c2288770ae7b5808bac4535f37fc56b6c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79c4f1b882814aa8e037fad7c18b98513fe41749 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63098490cb09b22cbb87319701dd9a3d8835d71d67379444d6a2df346afafaf9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba9a2e9326c0df8292c48d69c59497b255e842e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbbd66ef458e2f8ee426347f1af928410eff21d25cbcd60dbf17d70eb6e16f62 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..681d79d0a0c1cac1a4bbcde7e50aa4f7d90d9870 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96b49b452a05557f5e43e1dc04a3ed67de0ee14951d646ae635c9635728e8892 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb179fe6b11fed2b8a86db3bf4ad9fe346aef083 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:818cb17d913ad91dd011e4735d43d9cbe0a86f1d786a7d5068e327450f0bb1c8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aae24f4c906afceb82e850e5c32d0da3754689a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5370f38e5c6c5c63ea8b4af7015738f1dfa699d003f8c1eddf3912a75da054af +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..efcf15ad7b58e56909bf040d9b54b27d99bb153c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce23850797b05c3e527aca7c4caccbbebbc17a93866318ccabe8339453dd9e31 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d68603ddcf162fd7f5425d2491e723681af48ca8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee194cdeb67053c6fbad5eaba6717c222b466aadc1e5023ecab5ac874e72f3ac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d36a3c68352605abde4c865511c87ca5383979bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c9ac606f5df1f1f99c813112ecc4bedabbd0cd9c2f1ff58e9a9ee5e3fbb3981 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd34848b73fca669e70abbf451715b06c46e8236 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c36d77344cd676d03226c44f120b7235826ba5108b5db127e50027e9dca669e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..411e0f628b9f8d363703075ada8b315084301bd3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:108924c5c61093ab8be502bb03c894171bce7961f85069ef059155526fbaefbd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ef18fcdfeb1ee834bb2c788b1f7c22868342f1b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:806f07a049fd45e236140fafa75987fd459415cde98733e1704a10ac7319090d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b27fc194d64a68a8321ef0a2c062fe7f959fc422 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:206663fdce434003fa556b4675fc2adfd1b65453bac58149b001b88f2cc47729 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..144f5f7b2977a67e5db4fb0606ba14128c600723 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfdc1da3f7240335c7f12df9d70dee631079aee3c4d6add81fb582a309382a36 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbf28eeba1d18dbfe99848a52a255387780fa746 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bbbf8b076d38257c7eb93c75a4fd19696d176e57da1a878e14ff3054f26f6c5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9212d2683da2f41170e84f309611a50851797642 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:944a748021fc19eb4e182da2e3a5a0dec6c17cc5959ad3c1bff4c1168566094e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73bd9e17fa87fc62e67daaceca5edc4acd4af3a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db9522b58309e575825a770a3029bda89d01b04e56511840e7cf6e945f07670 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dacc9853e9c1395a054e487b7c5d413e860a4f4e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2651cfe7ab6b6b8fc4734f19e4d533e87a24a525226ee94c434cff8c9158db70 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1af8dcb249860019e5a061d92ca6fd95c9c75bd5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a2501dcb6ab513f6abf584813bd6a065bd776a6f33bf6dc756bbda9edd83615 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2de0086f05515ea5f8654f6175f980409880c642 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5955a6eb3a3d421a7cecc629335f0afd3b4c3cdb3b06e0a764fbc1eb308cc524 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..624f2eb0fd83992d8b6ad830bcab768a972c0abe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e566f59caf583a37e696730ad8e97362dfcac1f7ae4b4b9cea3c9a8897f689 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06c7c0c669c95923941416cbda93d7491b1b5d88 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6be7fb000f865f492def71c6b9a2288907c898d201b1cb496ea22ad07498c9b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1029effd6200fdf51c1a955788ac522a0f4b3abc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91a06c6f00fb0b675a376ce4dfc885c1b65abdeb1c79ac508d63a4fa6120616 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d16b7507b4c4f3aefc658a5a1e8c47c62ea0c1ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:828e9c56a690577fb0df11c0f7cb270235922c2a9886d04babd0a5a6442392ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de413ea0ab9ebe1b0fc81d50351bf5e00d3352de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c05784c28cec5bf90dd709952b921422279c77e1ea84649faf6aec7d03c6ca7b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc20727a35e30e97dd4c38a2f3cd4ee28f36ce51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e659268ed4c4608d3cd2de5c3dfb196f455373df7c0baa2f5cbf114ecf74db78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..192c3b32c030e45c3ae9345e6d803b4e208906dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13db82bc46ec85cccd7cd44b95ca4f5fad37d95e1fc46c6069f343b3ed86fb1c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fa1fd1b85044b7e2d61773587307e369dd50ab5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d146b8b0c441ecdfbed86366cb4a375cdf321501659fe1e7e4b67395fa46f50 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed87bcc6d91128118b536dc7e556ab06a9e1f36a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d874e9edf6726b299dc37398aa773c0fd936116192d698411044fa5c75775d54 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef706e50c07eed032c7a1544890c02e0df8bb5b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eedb46993cd6bfdc462ec219c3afcd2be7658a46be12a340976bdf721ab1d8b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d91e4d91e3778761b567e653b0f638efca44e53 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:547f0b82f0459ee6f9152feaf4909178552a9648374b65e8eb13c25165575ef8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ddb6a2dc2666661ad5a905fafd8ea8a453b275c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a471e9503337a8c37d2c6755d6f490138af62ca2acfcb9f3fbc59a0674975f0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b1c6187478495f98b314a0b2686848070d5cc26 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dfc0371d1c59212964ce5a23bd7ea7cfa61bd455643f7c055f6419afb9a4ae0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..232206658168d910c738aa6ad3c46d43f7a3a7ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a8a7bb7236b882d5c3f49156f28226dd8ae519bbe92a13cf47965c8ebb77e01 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3be28fe60f9389d6b4cb4362ac34e6252934f92c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82b072a31dda287332f47bd7a52c0b17de52e2679e75987675eae054ad791491 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..078072a29c85f16a50db896c8fdcc19f570a4d69 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96b802cd6ebb84a8e72fe11af2d958cabf6a26f74bf4e817b76343bb20e49d9d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5a48d8d52252d7d5e5fe789f91357a4eb990f96 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf5b63c49072fcf279f6de3ef37e89950240c41233f8aa487b37702a6b634a0a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c4295dcc9ff94177946eaa14dfbdbf12e64ed53 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bbbee21949fa5912b5aa78267e18836b3a13f4963f291defc002cb7879d6cc7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd379a6183513c516952a16161ac487512f84ad2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c18ba096c432a925ffaa07841813effd216dee58cbfeff943eb795f30da4395 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fc8a6a41bd78fe9f85584de2176c05202e09782 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:383b56061209552869c502c1fc509894940c5ada550fd4061ea885037e7c6fe3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..280781efbc89ceca6c8c430832eca363cb946cc1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d76032fc4330ef84ecf756a95b7601ec7be8b2bc6aada7c05d67bf5a64ab9bbd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e3c7aa678abd50dede28e87621133377617500f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e64fe3919902914911b99ed0057ed7cc33570219513ca5ac5e6db29b6320c0e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7189da49a3565721cf68dc92b5025cb6da8a1be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2300afb20a0ffc5b9d79bfa5b3c24e5809346c00595ec2bf0dd42c8d7ecd62e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d38bccf4d3bb6aeba3b9978cb3e1e1df6a8f4398 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:156d367842b2c2975ee66314fa5404cc62c152bd4e6494d1b14832ec283694cf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c752e9694c789678d9c4d88214cd1155bb0d540 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38c7ddc99cf4794084679490f9260d8d474e61b4335f5c62d12ad104b7462ff5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3f127f8714caf2056070c6be591b91648e71c57 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15f970526dff87a864a72f5335e3657f505e4a0d9d97006687bce14f2b8b7961 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2264e7f9020afd03c6db7f053ee8ae650c9b0d0f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c3652345ae6037fd1ed6b59fa2e2bc95455c4634c35bdc2405d6f7945341edb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c9d513674e3cca515712d856f36faef6405f367 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6032a05a151fe1c9ef8d73d789a60d9d500209341ca930928764d7153bade83 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edf823ddd05ac9f9844f22b8b02968c2ee09b9de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b42eb46e01929bc045b7f72242848527a29986313e7eceea2e7c77e34ee8167 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d10ae06ff99394a199e164002c99a08925e3d0a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8236c753268eeda7bd35dc485bd904d1a4ad893a82af108feb025e4ca785307 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da9139f931c2c7ee5f8684f2333189cd8f7f190c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7bad9bd8a7e8d9832dd24056235cf5dbc9d85583b0bd27eb81f15d4980621f2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7bfad853f914ffd35c20f89c3fa3a183d553e7d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a6f7f328621db2bed67df7bddaf93de6e1ca05e78e4549b11b6a95056d1e823 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..727fb698122b52dab423553d3c0e60a08b7b2fdf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6b2ed8e464918975b250a83c2158517677dd84ae73c77c734882b0afd39cb61 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..51d0f8daf56f666b99e24dc810010ffc7eb5e7e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b988d0cf4997b856c17bd202ebd7d18106a610b738c5eec166ba001e43b3b902 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf3547db4769aee403ce21cf96ddc33cd6a788f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea96a9c7f16a3a147fd953c83929a48bdf36d0154cf875c25e2abaa57b20e0a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc6793ff0484c1f54abd29161c425d7cffae294d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b63f0a28796a9bae7335475f8572907e9c76a8c73e75f7d72caa1930bc8a4ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..881be91840223a93adc1ffe47887f6e155e3ebd4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c07986234437453d6918f31db8ab957db25ed1bdd95c909d5aa1d854f30e165d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce8194db6a32ecf9c3f047432f0d041f75acb556 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3937a9b8a042c7a6ed02963056be06818bd8f3526b94cc54f1c00203bdae929 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4af39eb606262975c4021b88f5e6dbd29a4d4c8d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:104113c5a5e67abd16ed7a5e6ac60808c9976bb2d5585c6797dd36ea8a8754f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..328a5465cd15ee8143baca3395490a9200cd422d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12ed2a55e9d410fb890783bc61466d71845d2c282f7f764ff32146f95c7a4c4d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dea8b0140c92ce27bee53e519e88fac83bf2ad7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00d5e343167cf6a0f64239ea19ad1bbbe7aee167be34f87874b95321659b2e1e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d6299b824e267892eb0bfd17490d96e21c85440 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:189017175caf76b0e957c179f338877b71dcd43619ecbc87ae4c2f6d4d010e4e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5380c93e164d295ee3da378c46b2c7051fe478c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a03db2966e806155cab6c9b57b991e37c3b84837e8298e23f3b8c800f0acf908 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0cbc2ee165d108ed27dae35df205b9128376dc8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:893d28b68565b07aa7090e9b9f297e01e2c1fdf65cde94ee0774e34000ec46cf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0f46b89c556a1fe6966c946166897316b9d1555 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5917e139d0e4634225fa54e52f32e0174d5eab1e9b06b1d41b7448dfb65d4f8d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1abbfbe8db15ed8b193da5fc63396698e64a0fae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:633820e90c1a4a78ea1634c6b6b373c594312bc611727c6a04110b4d57e0e777 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c93c9e478c450ac97af8ae0272ee4701f72dc05c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b67ce952ddae165a366946484fc574a02ade9ac111925f889d5c5185227494d7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9feff4956457b6f67d2eca7b250cf7e6cf38dc21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e97b3951d28fdfe45dd37321408623d1f89d39403f46d3f86530ad495844ee7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..946ce0792dae6366bb256f4903f407c63db8b84b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dec7e4f0252a6581d65de4cbc831ff0149d2b96dc00e3189daa94b972d59d86f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28868bd7bd3ee60d83e5ac626432e6c724b27472 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7092c5f1080a8aaec7b8eee8fb59042ec9f2031c6ec191f294f8fa5b5699456 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80478c093446fd20e99e7d7c84a3dc65a8db96d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088a8a4c33c9879808965cceba6b074731e245e12b4c2a3cb7a774965eaae95b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7093d02a5b39651d0257d3fea8a71135dbdde450 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153b57752f76685e2229be907cca9a30fa460cc7ba0f6a3593e2044286329ec2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..409afee330e7e89aac16d3faabe891ff395b8786 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8696c8281653be05d9f5addddca169fe27cadfbffd032e596592c9a6404e6967 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c0464d40d9233e290cf9118d0091a2b2c21c862 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf26d4b96530a35b539b16fdbbd2ea487dd941ecd3584c2aadd9a21824528ea7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cafd15be6dfb0d052bb41ecee349194de9a2eae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b99253bd201234e5609330dc67e10efd2cb85e72b7512e74e76cc4797a79874 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8264be0500dbc2abb082c3ff6f31db3c9381ebea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:811c60112a69322f23961f387cb668302c0e169e134ea63acadf08d5994dd515 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8db38fdd82592ce2ae1203d192b94cd921d6088d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30bf7c152dcf03608d80d87771679be5be518818fd7a0a49e9b640b1a817fb77 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ad167e57aa9e1e93cc494c686c0da5327b875cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f7a82b456f0bd9aae2228e2e87e28b0b2c31cf1b5d538ab77281dcbe3835d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1c7effaec1f71544f52ec5e471d285c61e48436 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8b9e070e02863967e8b624455ac3f78e0eafb22bf348f1c7697cbf7b723868 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..921b55ae9f6d1868bf66b599ec303eba8d6c39a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f1ff25577e0476518ab566e73c3dbec4ba0ba3803086b81d0644ba5216192a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f05fefc946f0b27f5e1fcbdb673cdd4d3d4c06dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35e76735001fc094a7644aaa935a14257902ba628f1bcab87a7fa06055b51374 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e95b2a5e0df294e096fcdec3891daf6073f971 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f3f8abdac55d0fdc2dbb8d608ee70d3eaa5e39336afd925a6f6718541211ffe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e303c59691cb6855c222f0372628aa6b3328395a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bcdfd9522b8512368504637b0591f010984af36457092647cb75cf9908da17f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..476b9a4053add85002ed1b30bbc02dd5444a1770 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbe8aeec7f4354a4f66674b16e2261619b4edb3c6a8d5c2dbfb6ec3e4ba6b67c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d374a122418a67f3ba5cf47d24abf94bc5d23ce2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:984eb6d085b436a4b29b2e7954b16cb8ab4873bfe2ee95667c2129496ca8d713 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1610f73759b1f74b633e4a68584cdcb4c7bfe58a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f74524632f481cbf9fc0fbca4f1aed3a12dc191a54c1ff01773fd24eb81e700 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22161cb4f3f901afc4b8202aec85e21de674a6a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb24d23ad99cd89c09f7fc6fe16edc57ba3204966a318dc50ecb65d1b309ea0a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..26d674f1a960b88afd2130fb20d75180e5554e5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb1af28f7c31f3e5dbd17b1c2bf7c7ede1a389e49918f53e94c11bf11b9c52e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0edb9dd6c458e488f97b1db6b0964da929bada5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c0036c8a129335863fde3c853a099f692da38f863f148af1eea68050623c037 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ef5f1796b9b28b1c02a01f1b6dcd11ce722e84c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820e4d7f51070fd453106dc6c0771e83de9b1616df7c9a771c4030f3e4c2c5eb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14728cb1b047d8ee9562b7c0b781feafa8ba822b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963eaea31c7822cab2cc0617899a96df508d7d832cddc886e832c84b6e660dd1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3865f7ed298964cdbb40871799af8a3d4ef74d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac965a4f2df3f327673d8f3ea7bd7b910fee59a2f73c23e7e907f1d7f718b638 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b23cdd647f0de7aba8738009e4316075a40eb7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce13b0091c05f7de04af6d5a44d11a8772e0373494fcf8427afa52b2a678df79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2b28ea4339d420aa57fcecb92ce17df4a24c2b0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dde356924d331353fe7ed2490297ca57ce74308be583f858162e13c4fc0b68c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce408671ef948cb99b1c98b778152e618a3c898b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e72373b5b3b7897c82abc358f6a9c3e33301d14f2fe7aa388e847b1464248e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0495c9a83da0b5a4c637500dc71d813b36fc1e99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c1e1c1e32d623ad34e3e41c6da3b8041dfdcdc93f3f26dab4e2ac53ac27910f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f676eb33e2971b739614108e7c0a569b523f1963 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dd5e4da3b2e9523b8b5475f1caa2865e3acc0e9b4b41771e1285f5119a45626 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce8cf1f12e4cee9182ed939e9071314104fc947c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f7e8fddf3212a1373170d6cf6bbdb81b11049a1d61cd3c793f57911ecbd7f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4c1e03c2d7ae067fcfa41180e08f28f7c5de58b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2772ee737bc9f70f595de108de11e5a7cea1dee58c4d8c641cca0a6bce9fd98c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..09692a31334e0e031af54a83271df1327ceb02fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e76fde65a6c1ce6c722e118f61b6b789e329874a6d368123afd4a323b4472c3b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a07a2f03f62631d2929a25bf9c5bd636fd425c36 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6cb585f1fcecd9b1c7474d453edd685a7cb115bdaa3fc6ffedf68f902c07c83 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..001a3d939f2d083b47e173b5d8e8b96e58ef219e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8ab9f7271844658682cfbf1b822fba24b21bbcc8448c21508a4cae45be4066a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0bd703f20a6d31c16149277dd1e3f3921b331a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86ee21ca20134c220ce02c6c9104e043738a0e66464c212b24f5d180543d6c39 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..022b836f6a9cc7123c14f88b4ae107a035ff5966 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:573399c01800271b4b9565647772a8e67b12fe0677c7bc3c06de7180babd8346 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c69cb6478c640ffd6dfffe0b88c5b7bcb4c9f844 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7cf91b1c92049418e09c6f63354dee7f4bd10bb528282d62f6f3cf13434fe6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8469c855ddbe816c0068290daedb21b3daa3fd0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c9ea1cc2856110717ff3773fadafd0e155cae5f4e92e1eb02747683008841c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5e677f27d26de58946bc8379781e33233546f3b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce4ee2af1859f322d62ae88d0ef90a93eff26cc1d6e3d21ab7f23ebbf8628a02 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4aa2c1094de7b09b5ade5372a2992de4c63287c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b96b9423184ca630b62433422ba0665ff20b402c6f1a06b87ddd9fbee6bf0f24 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37761af537b1b026d6f5e9a939a5911330a23521 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e7db526ffb00f8a52970e10ba254321a05f9dc08e6dcd436cc3acb925744849 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..609ef2920c3e8d9f538b1e87ac3fe58160f02855 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f47c9c70a58655333ae00122bfb909f75ca7f15a2b70042bea7d995fc902e72b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b06ee39b0c52bc5e3b8f7ccace705ac22e754c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74a7e1d3751abf9a4ec497d7de25fd34a409e1143cef61c3fa10966ed0d01752 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..212e13053d6aff628e0cf964d92f90278757216d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfaa36d589b48a0e129c056cef4f52744e707a97fae5eac5d63f2b5d7b1d0221 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f20530ebe2bb1d94b24194fededfa8e3af9685e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d74838825b9ad26ee3b66eb7fcdf31a7583b1f08301baf5105c3b9b241b770d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..291e7becf60b3edb11087504aee58412f97211a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30fc4afb291e573307753feaf140ff5d7145d7bf5084fcb42518b8178646d504 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7df443cb283207e66ca59c117ce6a3029644d293 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64597971cfff06b3465c7d34366a61c29883bdaaf6e11a8a06e4832a9668f7a6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88c1d42e61eebf559893f5759d3bfcbe3ecadc6b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c786989fca75f54615fa24f888b400cb62624ecc37bee2eb1650c94baa868dc4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9239551d0d6c7e42ce3d87f18c47f84befc08aa9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ba057370ed657a2057c64628d2dcabbbb594a1a00d9b86f2afe916a9b39110 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bd0d272509c43ab1e57ef49c69df83b5023ef53 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6ab47cf2345626a0bb684b59ee8e546f47f28e90c3a91986343cf2fede443e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0857dc893b0742b66712575c2e5ca2acb16ab217 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91b21caa9cc89b6a4b66797f8ba99ecdb6c8bbc36332aeb13f25473092507ac9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..850966d75278c7b28bff97cdc231c37d3fea3e85 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b02eddccd1ad96f05576e57768e3570dd93d6105ecd350183d90c4ac12c63c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30c77e709e4b6725d1876777bdac39a8ea9b3c50 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c61b5401a49c73c4612e70eb4f1cb18861464fa7482b87587fac6ed25a88416 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ae8f0afd404e799cf2d89b5cc59e1b204be5419 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5d0f20e390f27efd9f666b9a890e687105efe811f9fa3df4bc876db47b06893 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edfbd92b97ec9dc1d905d0447fea843e5e485d33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9edf23a4ae767e4024186d6b8a9437f0263997ebb07e7697706204e90c47e1ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4592c1d311ea16ad0641c473c6329b7058aab58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa9e49423c130f6d671869fdb338a0d23e182d40b092b3733b39b7e10dd85589 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c781cf40508b3697cde2e72e1f3f5841b6ceab7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82e843925295882a8bafe0abd6d8360ec36560f9a1814a5ff5e45b954a889761 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b6f9d84c60e05d5947c774b81b652b7adbf8e33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a9927304f46a74d88a562a1325169f5b78bbb9c139ceb3c0d0266a038d79c88 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10120d1033d39d107a25cfbbc4684675677c2f4b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d29238b9f02bbfaac2a0f43a1b506fc09b8a5cff0ed4339f9310f61599f9c236 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc4799cd0f3dc5dba7f15f68cd29c6f6e92c61ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55cdfc475d3a78a9895416a8806f14a20affeda1bf1c7397dd3060f25580292 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c5603c81f8ce3fabd739221684b229afe528a99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4622adbfd48834fae351d45cb1f80316725a2e3d54cf1840bc175f7d515f3ba9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..334338ea639d10d92351489f704f7bd38ba7de88 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1c3caca74bab25cb20418119334aa62eb2eabc61206e0fad3e4c7ed1479f25a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..692fa20592fd589956ee11480de36240ea4fe70b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fca5028e09924f5b5fc9c23a9fd9e686ffd59030da402b63105c58cae7d8c3ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c2b48202d896ee0258e4a0c7682d82d0c048372 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02df9b41ceebed7823ece477ace86865774a49c6f5d290b89ec1b31973e19f43 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac2e75849d6c4f9f2cf1c39ae5a37459b77059cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f6d8b3d9f3c03e144d16dcf912e63477f240b5357071f3f42bf7672328c2603 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8d6528833b179bdb6dd75adc9db9acc6fc46b04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40ca23e6919c043710d02bc5e1a7ab04aef71c7d26fd4be3502f3cc27466d866 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..569ee9dc85242920564ee205d00135681b320b1c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a21c846b0b90f55721c46b14345f6b5e9a867e2322bb27027814acf9603678 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..270a150c3def1b4844e175c44a31d6aec4690266 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ee6c8b8c7fa7e1ad385717ce82142f26ed7f739d0a540c814e43cfed1a3d26 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd09e47a0b7943666dc98b4e18aaad65bca1924b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:996924f86e3d78f61053794c99231059319325a1819ad382bf7d36ced10c8b32 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..827b6dd8eaadeea154e4f527776e4a3528df1a96 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3bdc99c0b3c88ff82e2e6a5e1113f370ab1aa692305856fc043e4a49635e9bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d5c96eaeb15d4fd2c1d58463159921b85fc2dcc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc7da5d0c6f7687f1926f099d34a450fee1eea01355583df0d1b0acbc9e4129c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aa14a78231a23a9783c02c78e9c51e36b02e27b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb7852fa1e27ed1e5720f31d5d70fbcf08035f9dafa8a30f4eeae89cde94724b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70fb3ee0900d72a5818fe3d730ba9590f86b060d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf76bf9bc53242ab42ebd8930afb888a30a51d6a4cc902f78a74456ffd996c11 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b70efd60ab19cbf793ee5f7f05bb69178d7e606 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee56096335245c17f5cf744362ba15dab98cf62559f767bacddd41c42323b38c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31d1dd00c025046b01c378dda5b94621013c70d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97a3b906bac7345b6f3ca0db637ec2b78d0f14e21013cff5f5a81ac2871fc3a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c5654dffa7d3f1cb62650f013d64900ac1e864c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c334398d5ac5fa35ce47697e578e7daab1c02ebcb57246ea5c3e5360ee7ddae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..399866bd9624266713250fa622e11b478e28df3b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391592c2d63195bab1816bc3a2cbff0776ce7148034f83be4cd405190a8066ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6b42ec29dc11a25950e9570a825b2ee3b4d91f4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f768f8df669accd99d07183e66fd502b1997f45c56521a6b0e44a2d2c2c976d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cee76479a6c7e527416d0ffa8345ed0a5717afa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5086828ed84364ea9d472bed3f17b97c9f8e58c4b474019cffcca0a46874c4a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a137de14672516d6ac570ab52807d300e65ade8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15e72f05ac0f57c1d0e172e664324443e169f792d201fbab7fc921353d7b7556 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee036bd38fb30730865fccb21068d5d8259532d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f750631b117c8056c37ee71f9bfc591ecbb747d73574abc951e289ed8a4e29 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a6b1bd28f576efc706f8e53ac8f8c91c16b6dfc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:249ee7d904f3b111713c341ad8e5cce2a47273ad04fa3ec83205d53652ed9e70 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9dc2df26ef686ffa45d3792925fef48f6785b8a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:724ca8a780b70821b4e9cc1ea834e03ca325ba322e7f225579c55f1793653efb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17b9dda288bb89f3091818b6acaf7db22e55637c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ec99a7d32b7cacf51a60ab3b4f9f2ed66d87b2d15784e90f84a5580759f4bbc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4caf67347fdde86603db3acad14c29adf1377792 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f4152c3fd71bb9b71b9ed5aea89e45b4eed5ab18ce6df86a61a87d46eb5246 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a529a3ca7e993a8833bc92c5566241568f68cf0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb57671ed76f267c72459641d6db31b7d86f106b080dab0f8d4df791953939f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64efd1710c9195f33e2345a98398b212d6f43e5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09f7f8e98e6a3001fbaddc3d1a75dace7e474486c4cdb1d440022e70bad07009 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d1206f9bfeeb778e489f063b4c081960212587a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7706ac05ae3e70ff163beba3d9f3d5f240b23d284284503811b8524ee04f1696 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f915ec62012d9395a8fc90b40ab25e8705f5242 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40191ca2fd7d8089ea12c17284e9fe77459272c03635f2f511da876df421e183 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd7ed171c58c12158f26d018a4d9503feb3d9598 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337381bc5909c1e0959d14dab86a791cd9299f9c5ade6c514fb60a986fa6c60d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec628c12e69b447e6ca1daaaecb1739b8f1f7151 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f90f0a60f5774721a7eb27b1099a0d1615890d4d3b50d4d25249a7e2060d7df8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91d88665be1f0e2eb9f11ddd812a1b4c70646ba4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a62fba3e211db5f3fefd79e74d46b0c18c56f5d33b1f4757b11f009300000a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e25c1e6a3a21f77417f4be8d0afc460732ed9308 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d35e059491c6887280f583d8b3cf09a082c139575e268f3cea2fc09ecbc7d748 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed1358e538eaa1b1a61e68b1a3465f83046ff0b6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:191365850fcd2b61ae306526e86ecd7211617f252875cf0fec7cc0f2233289df +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98a81e33efcc8114e10a9cb380c13a038b771ebc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e0ed66e46a93b02663a41432f203af5f7e332f7770a554fc916ae67b5ebb148 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e883c2a8affc3e371a4de37addb354b482ac05c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa80395d6a203bb453693ad63a7ecaa14828a634d477863123c8cd942e7348f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..297d4ea0418e206a28e998f793887709d754f1ef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8850a307522931ca951daf44b6951f1660d0c82517b800eafa4b276fe8202e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..94cd694e1873c287b335848db7f0352c69c774aa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9632e013687a6ed6ca039a3fb556b7c5100399a0af56de2aadc0986208b591c2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdc093cce67414319afaeb603bc3e2a2dbfe0101 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65cbdc77285f0c7c6aa88c2915c51d2a735083625805e6a7e415d7e9dc61b25a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f3fa6339fa972961832db1dd0c79a55ab58bd78 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f11feb9e8f70de2445d35ce428e87dde85f002fe505a9756e82f81f898e6e15 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0382819895fd8138b347679d6f3e51b6c2cf3c5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:546a2419f542198d3a0563bfdb9fcd2ae712fda0be1d3b693ea1e759318833fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ad04641160cb79dbad8fc24c275e7d84c11281f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d939e9e1989b7d740ce6fd9647043684bd97dfdbc02d38a52f4345c5bcf9df6b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad3d38660a63d310d0d0f150ddeb8ecd397cfc7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec98c575ef558b125851ab4a6d8e480c843b46f13b700d96e6d698d49a27df4e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4213dfec1a28d3b30cba7dd0daeba8f1a6fed1c5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcd726127f92c6b74a3844aab0794aaef5f43adbcb42595ea63fa94b46cae343 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfdfed700b353a74b4ad0722c5e38682bd8019d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f7f816a33c74755fae79a71fdca00ed00fd7f9c7b357255780d88b57289a8f0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e294a9a5c841fce81bf229f0cfca3a397a19ebe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e309e83a44642b4cdc4ccce0026b967489ee0139f59ec1958219351aba947ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..856de5d888ce89bce60219e6237b1b4b05a44186 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:235ec3dff48786bcbc0ad88159bde993b5e07393829cb056ffa21be3ee9b8a69 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebbcbd1e010656a0eca7b187fb3965fa4cbe54ef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3513f994ed38877361ddcb58ee734094155a37313dd31e2d42ef17e74a7c13e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a991cf94ac69d61a8fe155d60685641b901b0b65 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1dec213356c5d7018b0cb490c83a0ca21ad0c5a775e0f3ba20a887b423155f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cd9aca494bd59d43eec1f6eeb10cb60f2c55091 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc8061824b28ef1694fa2bc6af4226b3ebdaa12b734cadf3eb953e21bdd4869e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2510ccebe2052ffafc430627ed9e2e62b7c69ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7dbb40b012369957c166e651cb7b9cd72a548a65962af08634b2e9e1c058c69 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eda9fcfee06458ea7036f0e3425186b04969604 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c20ca060bc2d08362457518dbd38c617763baf44799fca3571e0c0687886a54 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddec451614b54a1733ab202d2538d4a7cd1883c5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bfcc4939e9391f497c6cb9f02a707346ebfa4112c87a477963cdac87d05b188 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3d2ec9f2ca0b66a017cb56c2b42fce2fe4a305d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52dab8c42c6a7fba9e74cdbe4c9c8767a5f43951c33311d2c5e33aca5f253216 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55923c44eeeba14d2fe2a6d7aaa3fed4cc794e17 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d60c6c1db1d544e8ee036b3fde12f7611ec05603f600b86fc6234d334aef85f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfff675e2ad595f0573abdbc00a5513ea25eaef1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a29a243b42268d514810d679de2b311a8636792e303ea982e09cf8e12861089 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2add7a65e46c12c5e996ebff320f2c8d56d0d899 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:196decd91c905c7a6f30f91cdc82ab8443cbde5886eb4a93c7ed3e55526dfb9d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60e1264dfa1ce0c2b86d32cc096d70bb09682fd8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a6f11d45c0efa721c96087ac179207394eee6511f0d0a62c1efe7cdc1a240f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6664687e9ff1c7203ee8cd4c24693a030cff2998 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa075c16bf907653a1843e30cf76b302110d6c12121a486befb25cbba15a1414 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3ed34789feb35019d63cf85b72cfeb2910197c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a933fad6fb4bffd1eeac86c17d6b63ccbc8c6b81fcff7817e0c6b4c42b1899ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9446f60c3c24e6df4f7e04fa6872aa4fa3fb5c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:421714b461d3315c81059099356250d0534732f619b74983e2d128b5083ca064 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fb94117391add1bb3d718ad75de2caf2c4686ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cea7b1236b1a7d4692de897d94e00823e1050ae2a09c9b2529fb7555e6110391 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc8cf96d95ccd55b71bb1b9218043c117f24cc83 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0916d3959c708bcbde0c10f9ecab1ca5fbb80173fa4f598e472f55f9f3f87ee4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d7205fc2227de4ad85f3115d71b01135686da43 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25b31aee7aec5d220f948c33cf6457433a176ee867efac6b7de668b0adf6c609 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d07da30a1f0fd3f21a0bdff04c35ee4c612733b0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0d90f94773a9865ca2d60e5371840c808f562346df297446b0a782456687ccc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..030ebec8bfd04110909437a7da38f96d90fa3dea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edf246007479d2a3e5cb2e31a0491ed5fac9bb09a7ac26016897ab88191bfac7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0158abceecbfb69a49573e6d948431c9d452d041 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe2f1f3099a20b12a07f7c35776979ad40f952a38eb66a9e0364528a73a2a2f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f2b7f8d686a12d2248297ca437a4a7d9246e76b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fb5522cebf936ea2ec52e9103936cb138cf8ce04e5f785bea4c97a6948d0d08 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12d92cc13078ca16c8001a45dcb95f6948a8d1a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:713f8e0614d2c836e798b37bee298ab5ebd0cfff030152e9eff68a297414d2ad +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4946c757f4df905009ad25c40ba0d9768003230e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26745271d05238aee8ec8b1ecc039481abd432174edb3cb29ad3241a95287856 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15e2a2909f2db02864419e00fd7e34a75e9c09e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ba553df7daf6bc5213be3fc749948bafdd400d657e3a23fd22b50005a6a265 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9299fa44753b7b0bf508f147f802dd63aed47db9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6698c037d858859ad51524441f475c6592711c597a478c092a064d22347206f0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..683072df8f0e8ab4e5c0c153eb16c4850849faa6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:883ebf9807ffc3793970a9222e944a421a7221899de36c521525b160545cef91 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6207760cf27fd2b8d532bbf112935317d87bda05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02e38ba68d1833fe472c4f59b8a11061981cce8e63e9f05b786b4f99f614e9d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a03a6a85f4db9f5af3448d69fa9a8666675ed85 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab8be1f0b35a989590b7f43a0960682fc059f101092cea704511a6a05b45249 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97b927024d1079addd7feecc01cd38f5f6b45f99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c66791bd4c3bde59ec32e70be3c67ab8928e74ebf852ead456ae7c278e32f05 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dbc6004e0ed389d42289b52a72ec748fefeee82 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0378e677ba6c7a4846fd3404f297e40d44fc8b922446bd8a25f0ece53e6b072 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c5e207f9fb06f97ceca606c14673a8fb3393bb3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7363c6c990131e9e0d5479661a293ff9634fb5742b4b876c4fc1aafc7abc1494 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86ac03e96db425c62062a34da473bf2bebc5fd60 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d72790f0ca55fbfd48339196956742852eb85e4330953e794efa9c8c1528ec1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c10f281077b5991907300300ba4a37d46e3d8f3f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f44b0efeff3bd7ff27ddbe544762d519a6154bdfa9958aba57da9d5f2fd7fc5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..511910e49adbb153aa10b0566a7e944261b710b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ed44f1e67a8bc189718c4a9bf9e3b8a18699aeca12d2c30ac693067c1fc609d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21b441ccf81dd3d161258d350a29df6b536061d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c11d212de6c109f72d446cfd51f049c4dab806ac4c0032110140c915c5792269 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48cb7a6c0c1c287dd7637dd9c40e336b5bea0084 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3057b0ca0e274198c467f7aaccb63ada03132a2621c71d798c9d73e5c68cb40c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba94f5838018449ca1a62b35649ea906a32270bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93efada3ffa9a71f3af6b0762a7469251b9d5e88644125c56f0d7deeca99553f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51e0b431ff605974c10e27cb8aafb4c22c430403 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae50fdb47b90f1e360da25a1543d8cbab7860ee12490374617d0666638cf3d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef5c5a726ae28f2de75bc0ec894ade958d636663 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f180f35904689b51cdbc90d06b58af4bed80fa324b725c59b6dc47d972262b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01ec1de68e8e1e690bf8655269b7b214083f59ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d4ffbef8fa0b20b80fdfba6b8dc1ae1c32b72367af9666a9a7a34d658c97bf2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5f357654053497c8bed6d75adb3157b0dd77c5d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:291bb64c660c6632d50d8ae54096e7808edc693040c8233df2e958dec26eed10 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c738062114b0f6c4ce6774db36009d2e40885da7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c992f1712e7042205e27aeccb3df4c7b34765405b23f671a9aed189aae169127 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0885ec4c506e492f0f5cf9641baedcd75025788f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaa40d41814376f0d6895fa4f9c92ba5c6900c94edec17f3dbb2e0316e7208b6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f5da2a67ffbf67810a7e7226d8d2c5397f832c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf86d57144f48eae0ffa4469893a6fc95041c0b1a69d76491125b6b6875813a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9c4f87352a1ac27aeb7333fd156bd41c83572cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde89d4d59dda1b421856b155258bf3002162d6c5256cd99d4602c29c0d54b2a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92161d5d4919f86a76ea074b632e2804c1982c70 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29b6cdf27ef3d183109d23c44d6d933c156a5bcedf183dbf0b2d881994912f0c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..47659ad554728fdca4422cecd29e087f97231e3e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a64ffb17e3c10b71565b6d7930853483dc0e2aaf17757f1324dfa36265b0f024 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65211a1d2697493029515079ba81bdfaf8329392 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:282a9f87d609d5302f17042d892ab12a16bbf4548ec9892e7f110ce66b7da7a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9cdf9e445a3374ba6ba2e315b9f5f3372f26258 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:734b7d0bfc6a2655dcc5ba4b1dff7cacd94bcec4b0ff5588a3a9c1241a7e5e96 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e214b94196aa8c0ef852b709ab9e7169d57ef73 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3d6c6e454042d6e59cad3c5ddb66df6162c568c468a311e256d3c3f15225af7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..664f463d463d2db7abfd27b67259e169fb632935 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fac65bd03da7d24ab39ae5bcfc12e9b6f1198775694ec7be23ad2c0f074ca6c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ce8ca4c85c049de163c9b0d9a6b4be962e2281a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8044a1a735d5317b2f58e6607e6f8fd577599e55cdb0494a82185b740ad1619 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..054fd2f7f966a3c7dd782cd81834ba2a3ee7606f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc854462e5086b3cfc82c25695920a0db2b9997adc2399ae3f9d0f76892bfc34 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..705c9effa7c8a386eefb87ba70b4221ddcdafeae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0a520b7cc8375dbd1edce8b8e5724682bfd85f767466db278ccdea976cfc971 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cce92e2381f3c56aec4d834d3fe6e28b30abd54a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca5187b92dd4e06786b815ade48a0440f9dad4c7db0526318e2f9e2fa8ec7d4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..484f46b1925c5fb1db1d6476b916c2a735eb6117 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a06521f586baafac0fd0ea70301fb698a3e0ac370f7edb2e2469d6acee5ae1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6f91ae340e607a1dfe55e65a5e334f595802ae6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38d3484c6a6addd2748cc86aa466268ee20693b02a6e240e34c29a8715109bf6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77c826d205807fcb16ff2acaaaae2abc5349dc86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:518f81d89a72f04144b805e79695ce240598dd2179656eeb30ba09a6c8104f88 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b04475eaa10ba236899f2c986d85391ee4934df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcb2e576317859b6351591954a828920cd4ff32734d9b19316dff621718724fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..936ee655dc994b730681c9d8e8c9d26d1576c7c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83093ab28cd8181e3c71a46d1bc55e91e8985302f8b9d2040198133cbc834157 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fbc71ed87637d22275194083f98c2c8c225b17 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4b2d976a4feb11f59938786f3d723a14d2c715ebca2dc215629f3c86c39d51a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dc79f69f3188bbe56f768c2938ae62bccb8d5dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bace48ba75a81520714e2609422820e669acade5cd267fd9ede931a2699ad579 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8baf67b7b3d8908c1c2cd8491adf540e3447103 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf99aec650c56ef00225fef7e53c6b9735bca1ad8fda1ceaa9438ac7204633d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7b0ff61adefa14a7e868e2904f40a3af41bc316 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d17f847609687e5c84a04b910cc14c2568c9f2a6611e8144b1e53aea4bb49bfa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d474230187c9a9a5da7d72decba5273dcd9da4e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:596ae2dc2bccce1b0a426469d5791656cbfe6b0917ee64cb5228ef1b3c6c22d6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0965b64ce345358b747a18612774264e1d06a40e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f59c518cba0a07fd6ab07e1333c6acc431b891630e8d1647d59cfac9ddf98bb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..083b6da05abc3d5ffe709f0fa8fc7ac056e6f89e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9366654b397cd325d65456003d8467c35833a5d9f1299d5c5cf994159d2f88aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11edfbac7bec25687d4362e6d8da1f619204f923 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaf7ba9be080d1588091bc7a0cb273cb19726aaa79e462f296d23672f6852567 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1bd6e745b3a7e528b0200d8b6a2a08b44fb174a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ceb247d8dea288e5b5170b168087f62f11a596d2c3e88e343069cf8ce402e23 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85ba7653e38b60c60299ca3f9e73a12bf8cd9d94 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9393ffff64e44d292b51a9ca33aee398d25b769cdbf001e70e05ad815f513d37 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b88b2da329cc6c578579e80c99881c8fc80415c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c060d3f3c0fd8bdfb302981a15d187f724a799168489ff5942a62040e8a8a58 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..807fd5100c36c567216fce0b2ca3ef1e7bb55a31 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb6642851c9ef380414f6f1550960e32428d37559ff47218cd0989e2c22c34e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad20a8c5e15ccfbb9b0bd34e3fa88591d988c06c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b7ace19d4737c53539bf4778768d5d2ddfa2a55f76f910e093c5885827380a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cb409b7b4c1ff90526653b94725671c0c26cd77 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41a66153c7d2279fdc869da510cca4fa9ba6ea13ccf384099b707edc135e6fc8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bd2e27a3d72c806519db0dea9e3cce496efdeb8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:146134af5bd2189996eb5a6dc54b87ee1179ded388a688409128b0c5d2aca2d6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d34e7dbc1c48771a54fc529a84d5c6135911a11e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33a732ff96cdc846bb771ea80329066c36459ad9b14d1027f62545a8779d19d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3cc7d17d11c401ca436f5cbeca928909f603b1f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59e2916873cef8b65cd6c529e894d1ba0d710cb795d904641bab220730e022c2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..770bc99f5e1820a711070e62812c7603cd298e5d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ffd7c2a6e202b29e3f5792ad7e49299c3c11068df06381144d188e739af7241 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad2e40747cafd55fc1a3388e29edcf250508fc89 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb4ff9f5ccd4dea13004546d6660ed8d0a699a86ab96ce850c8886efaa259135 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29fce33b8cae0e316f6a886ff9ae4617bfb70455 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d76e163a6bc2f7093dcc945cb17434c8dd8742dcef7e539afb27eecd45c293 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ce080875ef29beb7d6e043aaf0a57157d6302ab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69cae0cad56658fda389daf5c66cb5545b50d402781d27a9ce389b232c2a9d07 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ffd028a323641a9190b9ec8f50b1d32cbe8ca48 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21d7a4db8618a0b487b315a238a09b9fac5560cc63145e6d5604267f64831a0d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a7da091d11f9710b61a16e90bf22c101162d925 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bd1b12e8af96981ed70d3f44e8a88fb596ed0e3810d5800781ba159145ffa18 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee574e4b651b9f0f37400e0f12e5a18f8c50f05f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3a1a0770baddd0d13ea1bfd22dc1f2fcbfba7511dbaf3b43043043b5fb91af8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbfe9c10776040182814fead23e9e0a764c6f221 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc98f3b3cdbc558151c4658a3622a73443ec01dd28dd4041956c1e9d993913b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02ccf32b69ac17f9d82dcd2254e7f81f7866c13a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d55880c86186e7d9c9c0a78b94729e481870717a7d5495c1605f41dcdbe6839f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7478131de9b1eb3920225e9de0136bc308d12fe5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72e07b971797e302e87de2e5465178fb2e90ff3846ef4e66413650275b9fc188 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd54f5f386699b15922070410f5754b082b15c9c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c4268285e7b2ab5b16d9d10211e29c7796fda68835ad18d66a83b9cb1a9cd89 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9112e5202f60b43cac55a45139526dab027ef0b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abdaa538fb55ef92f886f71d117a79e2acc94d81bea1b7c8ec765b812f6860ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3a3a5969a0b61816cd9e58844d1b4a776af6127 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03b7f4dc380bc2397a12e7c4cfb962a71b4dad17eaa60fd368389f24d43bfeac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3842bfedbf3dcf502444232e98f557d27c1c6834 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99327045bf35c18071edbe77f151769f54cf5dd11a44aee8a6d6016be6f4b2fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d829de203361a72dc4c9e75314435fe840d31ca2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27cd1d9d40d2c0d617a674b07466d695f67632546ac169997d471ee11e1dc12 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3d19b874877c1bfe54182ab79ff59ba242661c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8521c24121cec5c6a78f146ffee7efe9dbdf25290a4ceb1f02ef3b248b3cdc7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c88e75d573d2332c2d4f5f19e616a1f3596166aa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfd4af489046bef0c7a93e5e45ac2e749aaad7639750b1a76020a05d55d8e8c4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6d5d2e5758b86d695b4f271a3e32951ebdcf729 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e99765f1cdb0ee784d9d9e60c2e416009f9017d465f790e21891017c4007dd5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24c948429b9a12caf4c60bf820b1fa5d6557d748 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1699c0c5a66737e52fa80af5f79443280a06d9b43c80cc8a840005b74e19766d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d048a0d79d9d0239a3b71352d00641ea40fb132 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3ca0c79a830cd090f6e027dd55a50d19cebfdef1221b4c8221940f6015e2be4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3665b82d5cf6d95a4102860cbd1d3fc6660d9fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c0faa9741fc0b064e1835c7dca90949e6231c9174745a31644fc9a74d231351 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3188b8f68f3365d858566bc11081bbc703df31d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef9c3542699f691e18a4518fa47af15f57730719ac57ed65474ffbc115704f79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a9dbaf159ddb8d96250bbdaabdc3298880c9a74 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74652c467bc5540dcad3543c5dca19d3e62f5b31ddd8c2ddc3f566a7522b91ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be90d326b4337f921f13039e624309e9474e7ee7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a36b64327e2391585eee1f9d5763db36143c5ffb7c86e789596a803cee27a57 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbff612cf8912f5883c2eb27100c20800f7748ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66f1386a5c71f15f517690a0d89f1169dfa8e2612d74fb3d98f675cb8dac74a7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6b6851d3f10c6fccfe2200af1b3c82c9e5f1909 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3da920581c5637720406b7ae6fdc54c7cd01f26882b4b4ae1f3bb29481e45cdb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f67f7d29c3d025bd9c983fcb1de2264513719145 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2031e6a9916c209fc6403091fe2af941525f3329c7a3a554b30aa638d00e40ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e339131ed8982e07047cf0e5637d5d9dd9bc670 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7504daa22f7a20249ace65bb3d2789c495b8208df3426a9071d39746e024e12 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2e1c81b036ac476ae09737d8831c0a927cfb256 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90bee560b709f3b18149a13c54723b44106121c58e6066bfbb00c43ad6bbd1e2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..473f3f5117b1c049bb6a38312473e2e63d6e8ea4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f9aea224202804df62d5012a1e23db10ed893dcddcf5e419b049bac24ed5eb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6097dc452c006101fe5c8bba646d5964a2b1a354 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72bdbcf1b8e887d25964be91307fdf0678aa6946f0630b9532f9ca4bd2554527 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..20ea9acab3025bafd531fb369b26c3a2798b9645 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b5a2bd55b3eef01d0a7aecf4aecf30165d40b59f91b688aea41d9cf348cbec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..947a314481c7b6f277123c6bd1345d8cb08b77a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f75518b2e6677baa273823b9d0bac68f1487d217b5077783819ec7c1c59d992 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38efd152b3c55baef3cb358a2d13c8a192cd92cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6450b38720b461b8fdb6a2f6608403f411820bf1f3ee2147d2c3b2a54030d48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e87bcdb0b02a795eda2336fd0e72d20242bc8ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e6f4ae7875b367e656220d112b34065e1044da2eac89e5fb37d1c4909f8b955 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3e9a8ef895287fd8b9bfd2f7947d94ad4e07af1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6553f9b664c83b9453ccaf33e69aed76db975a576b4a134daf5a8a5b68cbacf4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6adb968827844c5ee1b2fbc668d93abf3255b69d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1288aa7b726e56f365f19f929282203a6932719bd3fc346042b9bb059071e0c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..507827e546c6c2ba52ac40d0dc0074300a607343 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c559fe753d0b9d9b8c2950515808015092e71c3e9fd596d42b4b5a578297e3c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f04449094fe271de479755ea04036dbfdaca069d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:808f146ea5fbdb32b2f6a3d7b816d0ceb4cba4f23fabe82f9df988dc722d088b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31413bd8d9ab3c6105831d57df284befea0a0a5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0791c094bfd1c9f3b9974af533a0a2a980d4f2ee18d2f16926416dacb1bd89d5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3a9bbeaaa405367e409f97229c5220fe8740a10 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2672f486cc0e47ae18d2bd7d51e619abe9f0328663d2f4d5d1fa9d12865c453 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a59af022e2ee5b7262da71fd1fc79595346cf70 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7cbda37f6fc05e10d24adf44c76d59090a9209c7ea21c12e4118b8118606a70 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96b6ba8aafc8f56476bb3b65c795cec93bd55eb3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8083170617623fb7871fa0c426fe0d43413a2d5ace73f6596b958a804be279a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37373a4cbc5d9c6b02384d8accee17648f4034a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de4c3bc36286606c002bed15e1b48d7dd54e4bff30f72bbb071ae38ce2134891 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a72d6bbcf678d7b0edd69cc4aa5af51b23d4254 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc349c57622d602d097f5baaddf2cd57de0735cff0e9cb4c32c8dc1abd68ffd5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea7e0e54ca01b83a7a65c8aef281246250d10768 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4626ab6baeb35b3624a886b2f3387daa2d21f572861fd7cfc799ee8f8edb99cf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74851dacb2a2bda545f8100aa11cd71bdc2d55b2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:634832595dab141c5221f308f94cdbe441dd2a2bf938eab96d9ffa5169f97cbe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..508205b24842923946826c34ee9c2edd24cb8090 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edba41008a34092fa3050df8bb6e34555976b312786a70e73097a994dfdfa6be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0ed5da301b94691ae47905a8a6438e085a4f7aa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde522a1dd126555211eefaedac3192ca30af46f4797969cdc7e99f7a8ba1add +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9538c7eff1aa5281d17f0f6c39661718f91e254 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4710480279bd6f25132337eb3b44afde3a0a4c22b3663d6070eb2d6124cecd8a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59107de77b2b2bef3966fd9fde760f44a5dc0787 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bba1fef157cf018b45b608a984f88af06d86ec27370249d4bc9a5b7a5bd1a02 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91ce85a00ffa59e0fcda314bf850620eb9b98bd9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cff6769d0df7b80c140b72c23383fb767b09a7c5a864f7c45d4de33bab794928 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbfbf6e473a84415cbbd130b52ba69bd7472cfe7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:450a9595eb901bb2c8a7a65dad9c542a57340849cdf0c4640812541ef28818dc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..18f8059b95cda1799f199efeeee3787187a01c0b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a33255c98df795bca6dce62138e8c7f74c1241e29863caf688612c57f1155db2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff27b0b52103a5e21d7a2a88d4521fdf87406979 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:100f22518c60e6d59a10586837a6f616f4de2b02fb3e83a74ea1cd0a116928ac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebf6d1b59cd13219cf8513d837f13d68e20dd97d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7489d5e967729510f5a287851e3d188f164d4af57bf4d4171798606cb739325 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d39a19261744b7940f7124ef8ccb2991ac942609 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d207c5a045e99d49c2e42fbe17c8abc0b3a06044f649248c5e35cf1d512b2fb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3e7f0f75306299893b959ecd65babd8dacaf248 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baadb0f5ec6811ffb0ddf8cc9e1850fd6a09d8ab02678291d56ab3de4e3acd53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbd8e0c2e1c7b6f12fda11c0c39776638fddc781 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c646cfec3bcd0c97e8fc57584834fac4eef600f19ff26604307402c5ef53834f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6d293865fdb8c301ff5bd6fea76c4695b5c3508 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c69ae277c0c12086195192bd59da21030d46364a0ed9839a3702a1110c461e1b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b60b4935fe5ec392e68bba035b2b009f649a84eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c73943848ffe22906f35778ea93afa01b8174beaa251431c47ecccd070ef4301 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb92bb754c6c653795aabf8d2fdd60861ce25b22 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e4745450d898bdbb6874570a9e82afbaaec69c939db6ad685493792167cf912 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f056d191e7190be7cd4dd3f3748cadadbc029f98 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef3e4761b71c5963a00a1954ff954f40a2757fa787f444d27effc83d355acd6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fc3fe02d7ce2e4c7ffba91e09daa0d5ef9cad7a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:496ed07cfd84da1a40115dce00dd01ad2963ab5796c10ef6b6a65e6710e59773 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eca43a8f06eff99afd56896b1bbf31b6c90e6ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bbaa414a1b379106b42e8d79b13e3f3de169d176b13df1f5e134d11b3e3543f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fdd7c04f5822c85a33e863070909a6d1840c97f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b25d21be954f3a5681dfcf9b88bc2321619710507b6374793d9e4f034a02d1c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cf78c68be9783cfd3befd3834777d0df91ebc5b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:172f687983e367d9159ad42a48b09fcb7504b926adf6037ed6813264989f7368 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..944953bb1941640e836deb2c964f94d8fc4e1693 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecb4f1f0c0e17bcf764300f11e9539238753db6b7da3da9dc4bdbf8aec23c7d3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be4c06cab4d334436eddc6f92fd77aa7efcf6ec9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef362a90cdfda476cb79b85bca2a40e22aac572081936b5d1319c1bbc2bbe9b4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b74e9bd7aea2efaec9ccdb6aba316a551a645dfd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65b8374caf4dc1e525cf888c10c32b130b28b6a0fd39b5f6f406eb74953710e8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eadf0409bc3f4eaf28f4d0cbe2d70520a8b2ac7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d00dc2a540e3be1924d64aea68e12d081e4195e582cbf5948d9fe8486a71f01 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bce5c6148b4351de237d2019199787ad13507509 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:288ebd1f49a21b804778e52f121c4ea45f3f7cd1ce52a91d25e96d74020def6e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecbe3c203707ad754f9ac119fc6380d0418fd0c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab106eec9d641158e39194dbdc4a254d3acb4eb4139bedde115a1031eaf380fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28052ed86a61147637e7923cfe1433005b20fd99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d89c51995021d12062a237a3d476b28ec462973aea50e3e98dbb07ee148e95 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f9934caf15bdc247db9680e00bccd7e28d84dc5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5910102bc67873b79ab7b71c24a852df48ffba3714a4609cf2996eab34213679 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04869966b7b6fbd3bf5213b32bba0ac73675ea20 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:314f0db5a84baa92be86cee1290c440235a545bfe036f42da782fc344350a319 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5ba3d3a088338ec2ccde94b3ea85721c0c77364 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:005e08587a2ac5961dfda2d3de1e7ddc0482422909d971542fe029cf13f94810 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..01f33c162fc2f9429fb9575713f9421c6c2588ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f8f9c5690857e137ee9d4c16574d58617cf6edc63297bb7d02c69eb98efa89 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb9274a91176c01470cc343afd5133e02074eaaa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66512892b1e0c0cc31fe38a2a8b15ab77b8fe861f221c37c78e9231b363f2abd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..515bb72e718c2921aeea6e67e808cebdc300380b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef80c40b1504b3083a62daf00cee049fb641c6f27e7ed1959712f8fbea6f324 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b50edab7cb827deab2c8a27567c70191721db76d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b69e94cc06b3cda2310c06606053056479ba8732d4576b8f62165573c9778763 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..19c7e10e46cf2ed0c9fca5673802bf17aa16b49d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443ac2f9e1455065c7b64e9f1f154279e8b8b139ba2e78775cfe0bb63647cf65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48bc588ca7eab8e606a4fc56a2e80ad35576962d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1de7ab19ef9b61cfa5af6f7341b34c1f65f3a176add880648234589e970901de +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1db2f71042fccf785b7bfda41bcc29a708eacfe8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a999c07f8e64fa8312f4f3d74932d59c9fdf5633c3f04eaab116846a9412344 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c8a89a3cd668ea18a687de17c11a4cecf38c1f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66c98449b803f7a08f706804447d0e9b0c76d192facc0bd04d1480f266dc1d00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee23e8fc5f1888bb8a855ae729b3c2e809305cb1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c750d692f22737033d0f0067ef8cdfd76e642eb7c8bbadc5a7fc15f9361cbf21 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be05d5475ec5d16156b5e7dabd4a082ebbe4dae8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbbef3a015baf38785beacbbe78023bbf50005305b0cbc177bb9d18208b55004 +size 11395