diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6b1e89375b16f2453b19a52ade9895d01705d19 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a4f4cc70d017f1431ec0c9b00678b1737f9173d7814141a8033ab1afe3e9ab +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe57b282fb41ba55ef4f2214ad59d03d087d5304 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91fdb5c473ef447942db7875d12ebdef4940c2182052cb35c5abb5866d6d3158 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b9a621719bce01e3ac9387ef3995ff9fbe8b579 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fed42aa6bd630319fd857d3045483ab8f264574d4262ae29e4b532b5a6b6321 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18fc390e2ff170d345d64da09b36af3c555bdb09 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8da4000cb404ff5c8a7d92729e0dd3edfb5e4cfdd0067d8c69d80aa6b181276 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e41804027135999e308124311c9a8ee8984bbef3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbcd0f3af808bb9c43d678dbdc3c597a1c3e42fe999679935dc27d6775126e77 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a09b90068fee82a309c2f79609848151ba1ed52d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44053f0fbfb4ddc207f4cac80fdc8547be7775d2f47b83826fdfdc20413ee566 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccb708d469fada600f142f272a45b1cfc5f6c08b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a13fc0dec5673ab1f80a61e7b47e8c71e17055fc7092281caab44ac7ce4fa73 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aca9625d4776a4b1867a8730eda5406eef906cce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63b3e9efba085ee57e7ba29fdf2f05801892e992b9af98ceede4c06cdc7ad62f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d48a0f5181b38dbfdcd09864db2a8339aea6dee7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5781e5cb20dcfb78599df23dce24b42b7663d52832a3325506bad0830ebae932 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51212367f25aa5e2f8662038020d43443f722e9f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b09e79041533de2999e8ac375af7cd4ae5e11cf431b75ef8cbc36872b400953 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e82740be4a67adffedc052bf7b9b0d7280b26846 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823de31bcefa9fc269bbf591d7ac582d88897187f8329dc659c7a39ba89e5d64 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df3f68b221bad28b5917f9bed480ea471fe80cdd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c212d25c09548a97d5c0504e56a6c0405559cc588e7507043b94714c1606ca2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03b321096b8d1672b246388285844beed9e5acc1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ee4918892e4ceb9eab4a1685c51c20db8df5041372ff664d51b062f2e795c4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..848b223df3164901d3cd89bb8cd3036187b0f106 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93399edbc8cc4865e9e66dace8dea03f1bff84a3a270c9a590fdef72288c20f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13c541978d1f6a10c43e026ecafbc7fe35f304e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7922f68e64115e5d29ea471fa5b92c29157bc81abd004706058a6841807d912 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19cadc2da77a50187895b43012241ad7c814842d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d155ec07b04b549220fe877c5420a33941998f74cded54d518a5f106cfab37 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cac1c13d42feb7684e7020750a9867e53a1d40cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:103377f5847420c2c4386036530e0759635c266068673ebc6207af6f2b475816 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92df53f25e13c6db7db815fee9b4524e4ea57b34 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cfe1af5382ceb62f5345f1353aa3effb8fd2555f57eee58cfe5741115db1d9b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6f8aba36aa6d6983ff6ec5e2a37ce3a9defc152 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1449469ed0f860b2ce2edd878b1994fb25674c1dfd8d86629ecf1dd57cadeeb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3b0611c6317af632e9dbbad2370fd87875ec46e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49d861d1f53e9cf68a88b8f155db7086f7a88eb32887151386ee3d6d2d18784f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d967933d27b818027f86c34eb0760638a84f4e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:882dc30e051f5f4bcf5ee3164dbd7bcc543002a5fef2e607ad687cf94067dde2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33bf78743e1c9dcd5600e35b1c8627a5a017f22c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a79f62415eaba53cf41a1c747c180eb5d28b72dafd125481a6dfc762b6434130 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8d87aa8f5b338de74c3b6522b7db5be7ab1261e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ba15a80cb04e8b760531dba0f94f4d93b119748ce5186de63e3411d61641abe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bf4192e22596e90444984541f1902e43f01a86e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f8b845ec508b7f6e5b7051a59bbde5c70fe3ed99e02110c198ca8f404d2083e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d63d89fef58fbab5edc42fca230cf0dff0317e7a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a23fbed056be4cf19394e4f31055e3031b76a0098d54e050f6b568f754d9c2a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c8da0d0394cbdb57aaaed3c40553d60a5f32c4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca3aae0cb14ec484bc79da77a49137f1021e78fcb92f472cbb3d19a2fec5211 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b58a4d5fd2f8b65c9e462085d96f3e1d17d7ae3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c034c8fb90adfe870ec51d39cca83db5d2e380c5014ad854f5ec670656c0ee76 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89109122955cfc9b098798f6a5a03995736e2166 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4884bd003b18e6b47f2effcccebdf6431403b4b65ccf0fb248ed5319fed3caa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a79acb4a9663fab6f4c145b9c3f38a9603b11ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97ffd2f6ce7b6a12a0b9c9dedc7c32046cf5ce3a8d27c73275c17822172daf4f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..397e29a4f93f21269084b752fb4f903d140866b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede45fccefb897d681e93b9b650ba1860bf607c8cde70067af7d0eb84e4430ac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7242c0e43006e086198ff395082db49af8362ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f54e400a404999a4c67600c39ef27b113e7d5d37777d0b0c080f34df642869e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa1667af5d877df38353679c72961074fa46711a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42559458c58805991bb55d192c1ae0401a46eb8ff2a85fe884e9b6ee134c5414 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef8de8741ee5fb12191dce76f6ac46ed0534db01 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e243aba70c46ab3868fc5fbe603f7a4dfe8fc974fcf113b6d67e72df5588a144 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1618af246e78f13d001b1a6d787ba8681f725d3e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23b72b493bf666338958c245145c35946f0021975b46c35ef2aca4d049441a1f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5354bcf31c3624b883f80c629528c87624ef1322 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ebc91b4b96cd201d93fda76b4246f1bcd817e5774aff28d3b55d6a08f223a79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c968acf638ddb5520ff459ceee41b7aa8bcf4dbc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84f0d4c1a177487b3b308897efe4320ac151ad854bee77c2d42250b840d992ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ef4d15594cd1a655949cd3e7de0e963c8b49f5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dbb6c3bcb6b7768c27317076a9d6d622de5fb8ac8ab192f71280d9792e5846d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..459688ad506a4214e948dd50818a151173b0bf73 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f8ed9637e82837d03b429b8cf5c99da57e52eec7401c5070bc00ced6dde880 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c3cbddd55185867a0d8a350e982d97861113375 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad1a59863e5f42bba4c2c1118c3fed687e6bcf3e53363947f0f81460089e34fb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab5a9876917f572b601a233f90a6cf446070544a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ec786992d2fe869f524edab7d3c99a1df220b35407079d09de26a302736c6dd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7de5b2d872e91d434f35264d2a00b2a7c6954a6e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:692ffbacb42c52243357074c1c20f00b6cdb5caa8496a31c99b84af8244d9c73 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9365c3a0045b8ecca558f44d3afe9d170a700e1b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ede245b38c592d7499535fa8c330ca0c53ee2123f93a58fd0eccc531b640864 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14910013e4f6a7048ae3512851252071599d345d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28badcb086b3bcccc13830f644be21d9ccec81ceeabdc3da3ba1853e703891a6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60e7b3996b7aae3fa4f991dd46ce7b4d87e65b25 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b16a504cfd24e19b9bffd2633539179966c09089859baa4c64cd830efce4a1f2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b38a6e7943eb70c144a42d793bad4cb8ae95cd2e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36a5e8bc579c9788db138bb0488f0bbcf896783f8b3abf395616481a15aa4d54 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fb245e6edf54b3d7054b193a179e71a1e916bfb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b252a632f605079fe1a5b0d53029620fa74fc9031bd4979f0f6f4554f4d56aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbd941871653852402499fb1fe7566b74d4005e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e74ace1a8b7804e4e99ae1c36a2500f4110a23329fcbb480adc4d89e8b043a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5a3bd6a5d43a02aafe9c9ca3be76a33e46477aa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe26b32b70d595ebfd591c023832747c69b1940da31e32069c20ed015117aa79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..267ab0752e508274f6ca735b80a0c7b5d2243a37 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c9151076a58c7a797043b031621f37e15ec6241eff0111aa520960d75c7d431 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c76c2bd17e94fe719c1226f6ff410f7301875135 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93cf4bfab2bc686a983b85f3cc1fce75a3418c997285ea5485c4eeb7958d8dd8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76780e0f9d438d468321db8bc0d0fa67cd0c440b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1f514e1d760094fad8c9d78252210682ee1b72990ff0f0cf333d8225d8fc9c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a353d3b664f793521b0863f3fa0129257867485b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb6f40803403ccc7135cac411b24e936e579542371334ed3348453ef565dd04a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b14a6f58504f63c4201232a144eb11c0692059c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c25fa123eec1cb678c1e0aa87e73ae200e6c3d1530b16d9a7c0d5277b4d3bba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..153e0ed9b58e267f5bf500e004115ec320cb4f3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7904c1486e0fa7c0a6cd204009f2cdac03c653e2cdce4c5216969ff12632fc46 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7de0a97ada6d3af5531ae80ae9984173c250328f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8463349b6bba50659e7624d5f405b3ab9de99fdc70af952c22c7521aa1dfe55a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba82d3eca6f1c1d513837ba7baee5233702eb865 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd46089bf229780f6601469ca77acfac1e368ebb1cbc53c5cd8bb5f2582b24a7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0e6c1a4e7fb83128ba5213fb202a1b21014c392 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5a452aa52eee908c3b234de8654d5c6c7ee1803388703fcbc858f806f2e51da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c04f38aa750897b43143c336d3d9797ffc8409a2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b00b3288bbd482c0d9f50e449731b8904731d97413d67a97e06ed80e0eacfd16 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cd1a7a489373a8f968aaa43a516d30a2fa0c44c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74a247202e68e3919cb1a6cec36c4033f3044c9d67286128c1e8c5ac13e896e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f65e4e206efc1a1e3675124456fbd35f2c866d58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74285f2a5436bb98e5c897bb3c1ae2138fce00f2113438fa2ffc4f40a8734051 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..497bd25a2b848df9d005abfd7003846d696ef5c9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15114c3cdbda317a66e3dc613b359c1ce5fe697bb47940a1d40a69a6f4ea333f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d07a0f3e26317d792636a656dc9cbb6ba5d64e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afba9f037745982f2a13e7a7c400b70f93bd9bf32e435764767c482151e4cb47 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f608adcd9ccd24512f79938cc83a0fe530fc854d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bfa497e744b9fe54c5016e30ccb7fabfc0d75fe1abfdd5db21c007669ebdbe1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d3bec0086b2907d45455131bf6cc5084abd02d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff9bf1ffa2a2b19d82071128f535df8039ace361112371037d4c26c22a035fe8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc3bcf6668a78ff4d192d6d3ff2e53e279835293 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22bc2ac45e451ccf7fba41b0a24c33e04b2116e0c035ba23e071749cc640e2d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5520f28871aba4f2a1d80f4fc5e078ad4271b76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb1be459217214b4c6d98b27a503e3ccca3a7a59c65c0ab4d7a41cb7da126351 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f71bc936914d967b9aa6b4d2f2ff7fcd9f3d780a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1489b560b39b310a2f3caaa140e297784686ff965c6f58e9bbce6870ecec937 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24e99aee54777a530e48985aff295a1d18fde3e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9effbf3ab31c64865e0f1bbc990e0cf408d2fc349e0ed7570e4522b177e7d223 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2559aa2b189cc05b2e461104062fbe8e3e91098b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edb90fda57196acf1a028661519850e5ee7ca1275421d36867b9ba578acc1756 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae82401f0da4ecc43ab467a3eee010a0f83c2d90 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:873fea74770be7f2d4398e15fd1f74a952cbf840904ee01157975b5b7c0124b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdfcce68bfd9864fddae18c453616346600a6ec3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e54cf4eecf1f84a74c7f4d0483e1e5343d4ca7895a885647eb79f4818ac511 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dc2f5f35d3273cc738254086efa4041146d5a14 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c984932e2246e798b3894867e14b524f2e16ba82d5f372012b7d72aae081fcc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d26ce9965c8415232db37946221266ebfbdf0c42 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd0572de3a1eb36b8dba60846b2d29bbc86a6a312553ae3be2c92d5d979ce0f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f085fb0dd2899a40f266281f0504b7f8415c47c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d4dd4302f7db374985bca05524944a5acb0beee61a725573fb9bfe7348efefe +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f38e1d400ed71fa63348e3c67dbbcea524fee26 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35859b3d2bad0e28cc1daf0c53accd8da7f37b4bb97a67b12b9c68b1249dca7c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd421399eba03beb497586d8ba4acc85c4826e17 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd04221299f739c86c6766a391609245b2b6ee4a4ff2ea6e546dfdadc138a36 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69e03a9920b00f832c24cf5353848875b46dc8b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd63f6fd15331b5b28c94a7a5e338d5b403bccbf3c638a29b9672424cc152c95 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69b2d84baaeb359c5e8e2e63baeaff8c4035f57f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:065b6be035c8756c70f682aac49e369f0a88f00614a64698664c019c0d3eef53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08ed2b73c7b052a6649e5db04f6af0d26ec7c4c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e93a57748d487bd8d647da437d69090500a9f6618183530d09937534517302a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dccdca940ba4bce079eb1c0819d816bcb8770a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:278b4755c194f656a92f0f4093cc3cbb170840d6771decdad6304cf182283194 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..baa4a0be0d995400d3c1e4f45b0d9542f3ea1e0f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:352b2fc861b137f5043e345a658965878da769571ba3ebbedf9aedefa00fdd20 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eedae9ad63cc861d4f8491904d2eedece3824616 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff3fce7031d79fdb67d8ba4a70cd4312559b349e7b81da362e4386bbabcc52c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccad2741c881a5d0a5031aba080a2ad66cd86d9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a3d13238d2cff8163b25c3ee623b0bbf279355a974c879caedfe70c7a30692b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeab0c6b751cd526a520c377dcdc259eb272037c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b25d9bf27b330bb4897308e09c0065e5c14391f9cb2e15973dda4134623e38 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf60f47f5160b5c46c13402447361bd490e6cc51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53ebf8aa4eaad66be834aaad2955293b8835ee6d8ac5d09222a4fd31166a860 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eed16510c529bff63ab71257f9e09f77acd90ce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21c595f96355f2ba8b5514739ab43b27c4bf4c8322310afcd56e76f372386dcb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef23c4ab3f45c52c684e0ab12472c4c48c02fde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e496634bae82d492571b9f1775478b6b450c79a7796b97c445f2980c370262d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12e6a16d1fa5192ac8130e2d4aa44fde6d021081 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc114b111cab9081f904f6f475a088c187fc19dd4fc9fdb926914bc69a8ad8f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcbeb0bd26ebf2a772006a444851f967a020bbd4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c45db904acebab7ec1c6db019549c1d193bbbb740a705d3fdccb93a2d7142d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ca4ff486d59161c235927318c35a6a689bcbfd3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c4b38727073579690991f2b43f6f485a8119058e7ea08e528db868ca7d9d938 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61541895445f1d921da5cf14935deb52e00807b2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4f6de9f9dbbda8b814fb450a357665ac234f846836ff3b263d4939d2592c7eb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ec4eb63b912231297ee9fb03abd61e5373b44ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f48de93c8058a214813840d04134bfa7b2509a82b2131bd445d1405b062f1d01 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c72803af27d9840f95b4e41ef31e61ff6ec458b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd741da32087067f2a915105566aa46b550a719520fad09591e4b79a8bb521d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7008faa668a26ca50932a946c008afd1586d84b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f621f4062964afee75e0def84f7033756216092d30f9c0dd7bca9df4d4dad8d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a478e20033bf94366e90d9f3ff900c0b574d13b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ccd21bbda0cebadeadd0fa86353a87f9ab06e2113ef7e9d9f9aaf291a2b293 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6088edd6755424b8b99c7d33c5374b0d0d6e5472 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0db8809fe2e1da18cf7db9cd796e36e9ffd797fbe8d6a8ac9e597330b1c667a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0952f4c59db0fd2b4cd3a1c09b4438771d795cb6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df23928f6c4ad3147a5b11ffe3da92152497434e08c1a3fddbbe85b98c99739f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c46d399a222a478e3eb5242a08262ae140bb51f6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21a63cb0dd400cdb772820385ea8e38df560834987712b5efce5c1b32779ddab +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4628a5009833ab922add574f0c0f66faef38cb9b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e719fd3c61b56ba4bb522003b52b182eb9bb1fefdcebf3c61ab84e77eadc9555 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d31041aa7810d2f11a46114bf21b4c4b0fbcb6e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19c7b2639248d409ad9c30d8bc5f227394277690edb3a0c80a8181480d5b019b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ea17fc990918edd8441d8ba7fd78fa2d07ba478 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94583490325903ecba390b996112fb7ce015afcb8a6b3efe53b344d27869e5fe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20bd237762c78ee83e0c9ff662cffed89e4c7de7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98fcefaa43d886683491a4cffce97295cf710c590add10ad04291949c8fb6e81 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9694bcb506490a7ff74ec54432af237936a37025 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb393071d5ec7cbb004ac630071da96ec8071ceae990a3f0dd3dd11128224e5a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2134fd203b017349ad724df91ac81f121942a52d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7009cb4489e1f4b9c31fb9d6f08cbcff0d1cf487c56c33cc8317e2a4821ce4d8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c644fa5037575f77012d78c7535f320ef7cd5b4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dbe053f433d6786942069acc15acdb91876078e4bea5eed1fa39e2a43bcd693 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6efecfcade94eb7c1e524bfe61a8eebe35d3b3f7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:160a708199657b7d6b3bcb24224a29325ec0e33e2a9a32a531e49ea715263270 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24c76051990347f65a272b5e8ec28bed4d72457e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:209847af8d93df77b9aa1524d23cba5893084e43fae742b07281e7f20a8fb8a5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46a1f7c8e01f306a3af7fd6772496e654f1fc369 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19c1272ae136eefb4fe601a98819977ee4b1bd4b68c608b96304b73f224ce8af +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2585a1d98e0d82cdc95d3419ba79c5deb6badd60 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e735a8ef63eaa28ee6b07384de2b3fee2f4d43beccbc4974aca465f2456c98a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f0641cb890ad013bf436e6c6920c82c5395b771 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423339eef05d70e36de90f1542605ef2942a2350182142df467a85a86e2c5735 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5597c63ce60176d4b367c7d4d74246c9809ca4f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32e6ab0ca99f9c24cf8f15a331f03dd442c065e7f6e472f5ae3b1992f15d7f1d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b27df4e2fc19b2e89c10e297bf027d96fd5345 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84e8494ad1581085276390a7aa4bd2fceebf1b86381821403d98da0d83065b0b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9417c86f2b060564159c9ca69d68365278e01755 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:146151fd98af263bce07b175039343654ccb8888a77fdc8074f57bfd15e4b1d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1604869bca13ce2f1add1145a435321d30a60f06 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fdfee95cf7e09ca5b88c7fe88e9087b10e3b0037ac9e704f1cbcb0f300cde9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..508465d861c2b0645212362f9788e0a74b9191de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fca7b294d0a925e9ff70d552c07537a771fc3ff34815dc81ef8a1a2d7d486127 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be955958bf53b1295b27cf9d832f2f086a60c7dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59745adb300bfd342d5c283e68965bbf167fd79ecaafbdd041ea7a9d0ccb01b6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..112834fc9f8a05aaeda52e4c09c7d67e84b1ce3f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47029ba8d1133bf3878f3631b6b8730bed39a0d581d8a35a7a761fe0f7e26a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5616c2d1ca28bc910d41a3e969a2a6f40a59434d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:171441cee44ee4362b7fe04488404505a14ace19f9c1bb3c4a39cc29555cacbe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..171cf0946af4b56e33f474e305130d86472d85e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a73ce7d41eecbbfe44a9abd2e41185a7737bf89643bded8bcb63b69a8cf88af5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c1d61872e03b957682ab74673e14014d46fcf40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3515c1f32dd24c2422f79f389e8f7d5f77e3871f8aa587570c42a7995622771b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f2b246865dbcc999b373dae9292d0df7c4eeba7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a47090b513b19f8ce0cfcb8e3ca306f89965fd4d3519e4832c133399a855d7f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..366aad45001e1d480ccddfff3207d89d25ac2ae8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c5b94610e9a2420024293b075696a0c6c03973c1b47cd5b254fb80dbb9095eb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d545031914dab7429b37ca690ff37f1aa50f2458 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2366d2d154370a5a36e257c80ab8c9fb1b3722ff02f3f08e1f7c61996b77cf9e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55d8d9abe7c8e8eb3f56b58d4dd0822030d34d94 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b8833f28fa6dd068f3cf7f83701f6ec36e8588eeb06ad7d2e2ddd6bc3885a7b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b9c7f98647f7150e2b3e172ed086291af9f96b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6596257c0a6891f0373cf0a2d532d0ae7115ebde479510752f9dd0c3e2a9c8f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29777bb727e89b243d0b16b96ecb453ad8465a82 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc6656d0f4da2b298f831ace28dc3429b1185d0406808e9f01ea242ca76c89e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aed1521fc6e4f4e2e12648ca454a3ee6331a6a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81965bef61610ff3583eaa17c03737f08dae7a40d00cfd550cc93072c7dc91ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01b2c603a151fe403a0c97f9e4e748d755594ee9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7650630d2eb4d6a57abc6b00b6febb201048b6467f41538d44e732647690c6d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cabfcbcedb3a342a3aff8c6336b51928a7a7b663 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aa121f40f26e3684b9d38924c6f98708d65c8a8e777f15efd381364aee24a8a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e7a7d5078f1e084b87c6a61ecb7c420520716b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:244d31ee1909161577a2d569ade6fd9d625fad0516f8673d2a3523d8bbbcc351 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd2b7b8b9d788e59198b944dd83b7f7281f2fa50 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:add8d5dfc93b711ef583f3fe25007965b5696b73d24826f9381687791544e9c9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5bc4d1e6423bcc100fdb4e569730553ac08a4fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23485920a0f71be7ab7e1fc0c1b2d80adb8d17f0d6aadf843662c27cd179c742 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8b0c1c1669f65d01c92443db3dad989ba39ebb5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79effb3348849a7ba49fba6ac9e5754c1aa99540cdca6e32913a976f8a8e5d4d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45cb06c5342b14cfa16033ae39cd55a60f72ba38 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9db71eb7558fe44878c781235a055a6ce077ee0fcf96cabaae8bc2dd0b31554 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9865969366aa171ca0db8b63a281b402ec7c020 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0fc180fbd129d8e5ee5fe970ae42197e38c48300d61557e2971860678ce2cb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93e6ff658110bbac14e01219e23c4dadba9d7c4c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef040930380d9d6ad04a411326198d24e9ccaedfda493ca2510428e088920b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e31e11855cb8c9ec52f155b1b40c5ed26c7c7c33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1df2531a3394f3e8af1e798ed11cb8270d643ceffc750659d2d3bf8386f92430 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe06e2aa1856577332ec60da6e44dc98bcc37639 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6efb3e553f804044b3783dfd625b19f1171475d646200344446e3ca898ccfb5f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9056016d6cc483b81eeef2371b98cd86b5f6f12 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d5598ca5bf27e46fd23580065ed027b67f22f5010bcaa8679a620fe5b20d1e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..326d04780ea4360c0c4967d4a0ed7eebf9326d75 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:363fce4259d279aa6442ad1392c3ee1ad38452400b3688d7b84e2da6f3e00e6b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bf50419dc3106c5bb1944e1b61440341368f59a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55bf5817d8296a544eb0a9ac54e82c4bb675ce380f86bbe56e6705420e2cb94a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84dae9120a1b58f1b0b4fe43a5425e28a868b9a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e544749da3a2976df63ab658a4faa5f10c5563b411b354fc97f3515096098aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eb300d82ba911a4d487172818fd33d45b82fd32 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef8d7a4e3789b0bd660a69be8611c6a9ba3d9398acf3caf478649dd56ad04429 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c05cc2e32d4c57210acf61a2b6a0668a7ec1a85a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5c021d0768b5ae505d3c09a7682e14c2e529f70f954f3f1ef00012a2bd230bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c0b0c82efb914f797c95c561d1e12a7d6bde1d6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78905ccd8fb3da483b2ec4f4368550b544498af7eec0b1d1120e389a2ec4b9b2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a351296a81a981dd992cd75b3b3c4e14eebd3cf9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae9fe08d567cf56469c89a1a102dd0d3526c3eb79c6ce48d71b663db94e274df +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55c71773e4397f7ee221a9eba74713f584955fc0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:603777ec56ee5d3ae9a3f7dae03c8ab4af4a3c57d5dfc5806e0134e7dbab7687 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f00fc69065c85c572527095852abb8c2de0de67 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfba47a2b5d95a86d6d270cfef528965d66b7a90657ff90736a907d8f78a9814 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d003aeec72bd8cac21e9a544b35b218273b3bb0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8590bfc18d0049fc13d2d890564c6c557737f17c0f9277b22aaaa83e1876f13 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9ff9cf456e2517bc3d027ace356c629806017d9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9800dbc4fb16568bf586419697d6c8bec6ba57e52d41d24e878642f26f8878f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15e8f98e89e0d6653ee6d7d662f05edb29af1564 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c766f71d822a9e8da4bac45f9c26e4cbb43dede4f30511b0cb87020393e17b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fc776947c6a63710f4ba97c00252f73ab0deaa6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:477a7855d7cc0fac7b02ff26bcca8d819f140aa108dec32100372a42071bc441 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cef112bfd6514bf6b5ee55464d7ba587538d1c1c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23236f1b3d7fb51be7136ac380cdd851d2888bf701aa3abd8ce99fcc5abd729a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd2fe4b28d20c0bdbf0805a1255e9628830e7760 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d4ee0eab31ca02621fabc348d71e9ba2e2803b61d843c0a6fb7610e8da8e764 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5989f8884a6560d1946237752c1a1d996f2a054a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a828adf689d30cd8041c7cbc0c2cbee5809b704676daf0921e62d7d7307529e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e85ab8c03f2c0d39799b6fb5d16ba3af6d90034f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26216fa9307d18d19bb7b87785e42eb2f9894df64ece94dd670fc2e97a441dbf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73646a1403bb17b72bacc4ab0dcb9b5848f33c8b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4014b8fb16941630b04de89cdb1cd4f53e135eb41915cea444ce110f3d26dbef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecd1d9745881b1559db58c4fc4228699f655a98f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09d9dd6ab3c46fefe77c2f81e4725ed475f6350ca68e94a4288944da4a6a0c96 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c9ac93c63e1d35ff64d204e5ae6597fc66cb84f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f051b1a2e238746cec618698e6c5ce151b37d378de178b4963552ca8988c5f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec9e1a714ee4922308b8fa474740ea90681db093 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a623c45f4abb8c84af022b2d8221f2567a9d837fac3e3347c65df4e9a5e4615 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..560570c4a52cfd89bc35688641126ddfe87b3cad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4593d06e125f07b8bc55073242b3eb37f7bb5526e00d827d76bfda092bb0f149 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26c96a1cd1a93f54110ffea9d8bfa32116cd2ec0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09f8d6d90762b632c8be4e2bf2a772df09332c7d49f51b110c9c5373197cfc30 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bdb549c591d5fa53e7b7bc9759fd7b8ef85ac55 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b14cdad22294e4bba5adcdbfdab364ef20f8ebf179ebe480ee34ee2ed596ebec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dfc728f296c7c135df6311e5d64038c00bba1b4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e8216d8cac9a26bc611d0c34d78facec5db9055c92c99205f6b3782a173890f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8f4a95bde0201b456fc70e1c9cb70c065341ac5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37e4e21455ee0b0366d31e69a19ca5ffc0edf9ee9fce21be9483f2f450487bc2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff1112df018d50e908d86a47e612ff0e2e32932c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ab0bf7a6148fee27496bb65893b49027ac155e7862bab9002596bb7b2469cf6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7002e18563f2b0d3619b7d5716ad1c472cf3c668 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c01648a7b95cfff2213e93f89407e364d579c97717b7a50f922a7de75417f6d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5722c04116604c0980bde200bf6498ad199f1d49 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab266c6d317fd46e943e46b4609efdb5525c7623a0c43558240f26a049c2c888 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edaeb716a3dc01e802017f36c0679046c045b70d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35411ae83dc26a003726d956a37fee93da27aba9ffa452b376f53eeb3417bade +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9c3d15ef2e73ef82953651d797d72809ade3ce5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4b39f09ca151cfdd81b61a5aa51ab3cca8bbea99af11f894f4b22f9bde64d2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97d7ccd2c4d923ac9dd5976e0e567ead781e537e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62a142b72886b3b650ae792eeb127baf95399256c18e8389ba40e0958155ebda +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab97c27a7c3619e0c5d22baf4c8fa02a2d9247e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2be8fd79c66c93fc9838a5dc21af9dd9c9ea6c07c4848c5c4bf4f13f15235b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48310d2a319bed67ba88cd496a81abc040c59152 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:468d3d5768aa51fa1af15ebb0be6eed25d838f88ae683d90e78a7682f2fe6083 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42cfb05aac1eba3359fe91212f1c88a9e82559f6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:280df2019307b3502d59a8313cd8332fa0e82a95a857a38afd47aa76e79ac484 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f30736230802667c451a5da63e5cc9724742fec9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c3047ffe2583305edced6e391509949f568c8c9935659e8a5a64a5d1722b1a7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..978a145da5de3f324b06083b4d1e25e8b047c244 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c83728db45187a07914e513cd1b43181b751f8a5ebef3567513e9ca61db969d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..980ad4df08f81675e6e68dd672d7a35f80810184 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56d0f4950abfc4a6cf861381e7a597beeda79e8d2e36ad1e8dc85a0d36e456e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5911da7ede65137ae9662fe74967c9f1bb51412a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c603490be8a09c518ffb5034b953460b0ca1c92b2bb1190089cfe41d5ad9396d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e37c50dbd6147dbc7e5f28e244f0d00a21ae65c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c65bf2caf78cc46bf28e13cb8def317924bb62b6532945ce55dd85fe01b2e25c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ed2ee4f6a0ccebffa233ee1db3d4dd3dabe5924 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ff39333870d508bed4a12b4330f486f09f02baa0bc5bdcc4f539830e05a531e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..184056e19ad621ab26c1209859e579c70c4c062d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1791ddfa87c6a5a819cc797729bd967e0bff2b92780cf7fabda184bd39a2783 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28722a459b134c848db5786ae4f0e799045d254 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca8b30f5175fa2ef7463a1373d410c5ef3b8337351995788a6dca5bd946199f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04ed778bfcd973c03a991ebf36b715f2824e3857 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:392f258ea6eb2a521b2e872914a057b47f513986a2044394465564f5bafe1cc4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..038acef39f61e0177dee63b6159bb9984b24bc81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54a63874e7a4a18bc6893d596ab725015cffa7ee13e31aed1f45ac5045423260 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..747df576a9144a26ba78dadadc2b2a2b766ec4e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08d79570616b84a82c4384a5c2cec7b33cceaacb37e54b1f65a44f0a440e1701 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb3e23389023f9ac03641fa1abcf8cdac5ef5793 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5674617706809bcaab2d0e553853517a85ddf8b36fd05968e452e051c9a642e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cca422a1f42a7ea26bb48bc652faf7abed08e13a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c269366e2ab392de8507685f111ca9b85d2376eabb3d97cbced4e8788821b612 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d19449339f83a934b357794d5adfabbbf15c509 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43873c8f7fd97c0973dd6f0bad91f95d394aae85893cc8b3a924c3de222f420a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25abb1e59ba8bdbfad18bc02fe34b74c47a6a0fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdd63c7d8f2ec4f89b0d6c99293972a519f4e43bf1c516a3fd3a0a0a5c424136 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d239ff27affbb781bca5505044e191e4d30befc3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b10a869c294fcb08226d95d7e1a6361f4f94974dc7f889c842270b1ff51b24ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73a41051c6fe8e5d161afdf1bd81a8367f9824ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f6ce2c01f8ddc8b643c9f7ffdc79df0427c8a749cf1e383d5cfba7d8ffb7541 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7118d4877e71ae85671c584edcfb96aab5f8ef9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a00b9d93d6fa2f8da64470756a9befd67c07b8202f90ad4d1b6a7ce4b6ba71 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..551f0e948c2f795ede50ac26677d75463b54e250 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a16fde1b406aee3d1faba85297ea486656a91b1c35f9f7ac7576c4a94120cec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a55411f858b3bd21348623e97b692f0b3ce2afc7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a65001dfc4a7793c2f002ba7020d8e82a47241e55cd97b1f47ed7a157e3f8fff +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00e49f69fb673b4d6fcdefa06e6c7bd911426117 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13459e53b87550e2c668a14c17ec62631650e283dcee02abf516c839fae6acd8 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcfb8ac4838a8069be16ba4a7a6aa604d4269a3d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175115ee3fbbd19b16c8e40f675e33a6fecef91e39ffa5de354372906eb6dd3a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69639ee086a4642626be80e791c5a4aa455e6487 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bd056b0011c36bbaeecc20d30bb0655dc50db867b2c6b98fa592bf96adcf948 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd7bef0b99fd6c0559df5924cc9020c31f549e25 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c2f47f72bf553c64882e1de63abfc29834d874c4ced0163fd12cdbf5407a3e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52a9b0ee43cb33a306b478a87864d1dddd6db746 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2613fe5cffd465fd5bb7e0130fb051a01da024ab3535f67ccd9ca1f878dd5a3b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e5d85098421e723890ad01693b2de96676636b9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe8e6ee439dce8caac717d200516d03eb9c42794432bcf360dc2ea664fd0e59 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2ea7eb3cab3ad7ebb1fb6d9bde48cced017a2d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0138901c09889c000429722e13930752bc2e22134c48ea5cabfdf6686af75ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a412f01e440afaaabab3f7249c28df82174993db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aba28376a0b18982a3126fa5917354bc4f0f451cd2f9db21add6c6d7b801d995 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9a5e3e64dc6816bb0ceafa23227d56606c5d28b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6961cf22f031e7a2ea1a28c7f51fcc1d06ace0b060098ad159a15a8837721459 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54a1e28edd250eeaea05e7ff885ec03c8f6ddf33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a9dc9f63574c110b0eab4778fe21b78698f4bf69acf0484ab6afa103cbe36c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfd29518ff26a4904cadf0a4beb30d15c9e9af64 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53c5ed9e3d7ef83b7412c59eee902c6d60e3aa462da139d3d638c1d425cfa9d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..231bd265128b77e2dfeb8ae1286c74164a201216 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c450306c37f8c472ca91914dfea801d72a0740da22287f739073677ba992ae4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db9c42e705e36da2d03633622ca3eb183039f080 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a5e0bdb48f5da44d8159ed687d504550df51aaace3a0217296d8443b7531a5e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c011f30fce2d240295437dde42b4ea69418879db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e00bf88d3136bce675e5f03f14f39f6e2ec35be8672a491748cc13ab0e4140f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6140f1aa219a8da71279842aeeac2e817fbc9244 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01591700ae3a60f54b9da6fa449754740a54c3776f531eea901f6a311d4fdeab +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..863f5c8ef6ee50bd4103132b4801ad029f87a4c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f4461e9f7cae2e4ffb25d2acd073e3faae874f6058d37e623edecd49e81ff23 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ee814c5761ae78123752ea13b66f33275d972e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1003963fa02056d1c65b1f8cd3296b648bd6828e4d3b3246f579ee4c899482c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e7f7b9c6db1faf210cc0c933e7f7227dd97f4ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb3bbe9ab9a689c03b0cd633afe24187995e0fdda1b811d6340734acaeb8983 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0442331eeba796f5c2f16b42370873baf19a822 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fb55291c8e85d1ddf047dd622aa593a77d6526f617a9d4f4bc13cacd6b37db0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..255317c493c7bbf2a9b42d626cc39c859d06d0d9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30724d5984fc5960125781e08d3993a7ba2cc2ffacbe06db9f793accc41ad7f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..206e5eb50e0581f93c2834480c26f1a5df851b7a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60bba354c3ca89338af8997d2fca53f65f167aff775b62839c3d22f9d587741c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..83640c5c92508bfabcd7ff4cca93eb3315471f96 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79135946ef03470ac6672ef77f1a9e8f07230721b4892c41ffdeb11fc5e74917 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bea8fd8ad4220a3c62b22553afb449286b0d29b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac21ef1834aa7d9fd8a2d1ea993ea1c417cf0f6dac365e433bb83214ea1ff6ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f17dbeb7a4588e8347ba49cc37fbeb6e25aaa312 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71ff0db4739ea638dffbc17ef05b447b19ee753e239807491c6efa4bb15bb63 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..335517147de7d76064cfe8aa7c6cf0c4274afd54 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67bb724154e9cdae4ceb0c990f8e78e9814d65c1d52c30f15c1ce9e67281f76a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b5a7076a63442c1ff63d79e34927c3f74f986ce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05fbd0563f2cc00ca5c2225b65cca974ab25d0cee72f2d5cc3362e11eb3d2ad5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30419d74c284e3cf2da3306a6d36aadf520393e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30fe911e14a26f8ea52c92b77aed66e8e85c3561c9fe031d36bac01bf728d754 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..174e3acf6690274941819170d593ffa239e35e5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebcc05d5a28d4d4fe53c5dce94fa12e4a03ae00939aaffac630f179e0842ce9c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6409c311bef028b3889fb6d9e2c4586b10540b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d384daaba746685bd3bbb3506171f83f89cab8e00e9b8b7668f70b888f3db3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0a88e3ae5c67d2aad442ff7aca9baf62f6b7863 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:729bdc230be6cdb469ff6dfd87c185b683791584142922589152719f0be94498 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5ba59ae8b1f93aad38b761ec21806f6d047b0be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64f877b06b8f1ffddf8d6637aa7a3474c1b20bc20c4d6a8f5e1c45ce00e4da34 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4665b5ad0c6b6212ffb146dc147f93c16f72e7a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75e233cce2417ada99e9fc10fac5002ed96f7528ff321459926049f5fdb84bcf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c05c145a5fe54a616d3ed029f0b95cca27c9f41b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8b6f169ee9de88ac9cd2674ca02f743516bb7ffc7ae067e358dd859614caff5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0033caeccd397a2178f5dfc581649c262a5c8424 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:889b08457249c251d88de829b7e12e396632683399c9538834367d2c42d6a045 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..095a42ffddd060e2c14f3fcf86fc9a7428f2b72a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:304f6feb1e6551e02eb7609c665fddcd58a3bd1e3fd8bb62d0b0c07718d60dc2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b4145b83ae21f4b4bc150b290506ce324d89387 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4e8021ae8a5107cf8384b58b557fedb530e3bdaec183ce1681e6723a12ae89 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b25b815c9d0f0ee95429989216e581ba595d8c2b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b05a373e6a8868299de340ce6cf23a837cf58292455222da39cd9a3718010405 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38559615d464ebec53e816a4099a70b3fae7a231 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58176a477338546c595a08ae1f3a2185ee3cdd59166e88d930be9b136d258bb0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..570422aac4b40ed5f6a1ab3ae562cb8c384f4ba0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:599cf11aba1c48b07a896e905c294de7004347482ff1876ab713e9e93d6c1f15 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54b04391c80ce642eec796efcdf535b0f472148e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9709b8c9049538d5b0178e02812e98d5a265af67a69fc50dcc11878d113f863a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fdd1c1818c6c3e35fe8d9ad729559b9f0d1d73e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8361ce05233897a7a46e806988adf5ec3eedd8736682981e79774ab0cc6a2cca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..25ce60ed93d5e590e1c5cd1196bfe966c8f7fa46 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:660372998c481173aeba79da3b0d1266357d2957fdca590378d2bd2d6ebdd4bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a2ff7e72ca9d717436d5876e36ebb7e6253d362 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b40f8f22eb110621b8da52f28cadfa0a806dac7f12598ad997d49b34a21fdbfb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f384b550e25b7c543bf75d3d8b19719ee9450cfa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90da04c5d7a1236993ef124939aaa7a2eb2a44bf1718b332812ee8c61c8a3d15 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9edc2c5a300dd758961bc5807da5371a13c6196 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:704237f4c8ba48d13e246cdde7cf588251dba8f787ed918ecf413b3af082030c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ac2ac476867ef1b11e0c40a39ed4e44b6cf158a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d3485f58de7693d282806d8a254829557e0d09d4ffc5e02c511857342de598 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d9652964003555fd356ee0dcd197de79d385f6f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b52c2b03b63e66f7c8960b1754bbdd76d8f91f485556ed8fbb051fa94ab75204 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9c2c2c750c66c066995bb1bfecf81eceed036dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8f8065425878c4868632ac8acacd703e4f60dcca60460e9b1dd05cf26c35a08 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5657b6da172d0876a87495c48de5a26878ae1db7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e980b4f71bc9cd2d9edb81a1cfdc71a370fc78480169d547422c376ba46380a1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6508f50c53a66200769ce1e9fda2886463e0f33a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea5d06061715386d0235de7405b18345303aea9ef98288ab13518783eb74af01 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc14e020979390a2713ade10f435507acff6fbdb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4640c0454a2e7c5c997d3f2f6a04b7d251bd9946cd218f816715d021e4b7017 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..418e132d29ce59efbdc4d3a2f2d86ed039cb141b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d5884f26ba500c602b5b8e0233e6e94a224c5d6ab6088480ed18df7f0f68423 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..caa03776fc3e6b25489d1a05da1b5788b26727ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3644d5a36f24eeb821f2a127eb69679f4fe3d0a3d9a4536df813063e78c0eef4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae67a7804fb394c241e4bd3a9f6cfd793f15014a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a4e74e21373c6829a4ef1396db9863c9e177844fcfcb50d070f2f2e51e8af0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cec09e98fd872d2735c354026ba89aef70d1bb6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bd8c28048856b0a74194771879e44b0118d88b9dd4191998d48b3c043f7664e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e859a840981d3262514389a5d939c671bcb277cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543c0d713e5bae1e3db7462d82da0c5a08c7bdade3f8a2e9f361bd74b017cc64 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30fbf3081cfecea261f63bcee17caa690671ed99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca8efda7add8aff137bf6be4a84972aa47be2c57918efc72298b799b604a002 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c5f21cc8713ec08a9b84ce858df99b89aa30844 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a61fc0d41eaad2728a0cf2f6026e8ec26981193d05983e0f4173fc615ff9ed5a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dedea9f9a45ef5ee9ddf4ea7a51921ee9fd5243 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8c260e79b78b8062d66f0ac80e205a54035d5081285b81583a5c7d5291bd90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..45c74802c4241e6a3da206fe4f70c7b3b449a5c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8a0bec6a9fc64df42dbc5f04268549bc37ec90e77fc16212db78f00095d950d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff8f4a8dae50f79fb13053f3421ceb7a48108aba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6fb6892f8f02ea4269370cec3b0f57c87c95e8156a59fd7118c6bebcafb3508 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..451c9d1a12ab8e8a0ef3e123a8cf839d1bb12d8a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff8812e30ca787df33b87a8e7dcedbb115d80c0e1322f8e64bf590e90cc662fd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fc15dd9db2dc352fa459a727b08338126880ee0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65e54b49fa6937ea848fb66b527411b796b1f0a7bbf0c153c7ea09319af55416 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97a51f8c7838ca5c9082f4419d53839170bcc80c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1b380ae17a5de82bb2c77bbfc4582d3278e6f856b5495c611392daee25d724e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bb7228871542b7eb6dc282c64efd628cfb11e29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82241afdea487cfe8a7ea6a83908c404c81550a6914256c38c4eaa7596e929d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fa2ac0149baa8e59d6415d9915165ac265e69e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce15ee30252625f33ccd8efcc286b6e9f61f1928fe905425f4b8d18355e63753 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aac7680847b3eb4d0bbada65194b25e0d05f843 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d9503e44a4cb8a825b7bef05e6ce43ac5967f55b16f13f35961476ad0b38e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..882600663215dccacc230a76cd24c8cbbb7a333b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b834145b95bb7a5c3f9775211e44fd35d5821455a24c8299ba5361070e1b2cd6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d47315a403d35ad25677d34278d4e98f5171c99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b75f60658c76c745addd56a47c15ced1ca9e10852438a8de1b408987c471f47a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b2ff791d1beb1b11c6c2c7d1a548c0e6232a22 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e17dca716a5b771b45a283117094f5b6045bcec94ed4480d62a3fbf7bfdaf0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6701dbea8c965ba15c78f08a99acdba89a7eed81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de43a6271d0da3ed3e60185d9c8285194c9ae748cf89c6f0397a9b6fb06cd9e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6a60d84ef9797e2ab5cd990ab48ae03830f4616 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e09ebedada3bfc9fd98c0473b078ce0d9ec8aac6a17ee4dc3ffddc6277c81ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dee8b32844e6b4a3e7eb49721a92363e97d1ab5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcdc9f6a4cf842ef36cfa20b2e4a90120e6df01457dee35f04ca895eff66cc1f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b217a749faebd82ed075aa01b79f2f32e5037d64 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4165e34c5d1b88ffa9dbe8d32c5d0db319fa4ff05a4887cfd8abac9280d88b49 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bb4efd8f817412d8cf121bf2efae2ddc996057a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e73425a38f99c270a85facd9d17249b43e3426615fefc8660ee2c3528083078 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2f101ad9969b76e51afacb5d3c83b2464ba95b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ad72fc9a1ab3792ac7b03e1a42aa7e0451bc062607987d97d916f13031c2192 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..029c48cb51cede0a69f6fdcb531373a574dfef23 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97233ba379f054358326c0599877fc23dfc72fb842c434cea85695ee3a3c8234 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78d57c6c846bae65990817ea9547c419f83311c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdfd60ae0e771353cc84c80738e51de1d74a11383dcbe0afa6bf5eac515b1492 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2409d85a6247e1d205230e770b40e358ea1d6453 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc6fb11f0bab5b279bd85da3d4bc46aa3921707e2b648110cb94998bdab9f80a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5b99c89ee6337c14778e9bed8db333363cee3f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d5979f51198476da8f30d244a0945ba998d6cd1f83a3c528f57e36fd184a68f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8edf081a6ee352d71a42033c46f68f2ecb49230a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6957439229eb5cd1aa06614158983529d06d36389b8f0e2b8229d79eaab76a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77f438ba69a2ab44056e312d41aa002989a0bc7e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e36d8a1083328e71786a4311cf3dc671f44e60e1848d007fdd79300acfced7b9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..345acc7ade0a07f07c190046189d7d4a559f0b43 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36cc4d1a0c24233eb5ecc721f3f7f33657636818abf8b56dd10e8ac35812c30e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..967ff63e507018628ea6600184755f3bd32c9be1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede740c4f4c6f332c00a272674c1a2a6eab44e21f3560058ad63c22127ab2c90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1f5044a9fa47069dd99aa56384347172a27d5b6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:902426967863a4f92c42a841e56f1371f5ce3bdc3d5e1101ae72754d76ca1c41 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfc16e35939696049ee7a0b5acf6b1ee1dbd1162 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70591fe8ea81e89b45d28ec04c1b88867860592ad31045ff89ded6179526ddb6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cae24a3c720d83810e76f9cbe8e843ca7b7324d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c60ada9dc89daa2b7a6847fc266091f16f418e8504da2e27a7dd9ae9aa7b259 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..15175b227efda5529f60801941fffbe6814bb74f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46d5250c41a6d72926351aea8488f2f7b2ab05aae40a4fa0a61686f184c9de0f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bc7e3713f4afa71e1dc55b29b8feaa7ed3b05ef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd60010e0944fb8c7ae625ff0eed292ae611ac755f8ed68e443e0f7b8e2b9c4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d953143485134edeccff5e805d34e8cb26e0dd84 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3046bd1a5fa8bfc888ca74b1e778363ab2d5da9cfb173530c13b11c1c8ec080 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f84addea5a132e4f1e356668693e4d3167b7e76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ff250feb26b296187c8aa990a3442db4a76b71f4b6d97c5d867145c976b8738 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..473014d4a18b497c98d5cab86cb340cca0b019df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f1b4f790ada37f3cef9da20fda22b10d72b55346d667488ae495b7a8cbb69c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9ffa493cfd4e144de1187baa87ab559eb137093 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb805fc9b8a753806e05a49e348dee8c554bee90f822c4c3c2184f762ed81646 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f857d5324e826822b9a423fcff168c70b03deb90 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19bbb6ffb3b0dcb48a5497bb212f86819fbaf6ddc6162bc13821420d6fc2cf79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0e161ae55cb3e8f7fa91113008a7192ceedf8b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9649844d43312722977821e0ae645f8e32828deaac93e34ca08aaa4f9b9843ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc23721283e9da37657ae9f36a5fe2263467de48 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:468daba4a45b5264d142f8293154513b7614671bed3402ce281edc1ba706c33c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d17e2b6ff5e20556cd21a97cc6c442ea378d943a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c9f65dc332af73a0716d10ef962f9f60ea5c74dad1ebf3136ddc0053097bb90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dea7c335f2c7b99215d935b34a372e6fbdabd75 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb575c7608db74b98401d75fb0c1a25f668558a102ea4e5fe6827344cd809ad8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d1c4085e3ea7a4588b81045230d90d7993d0420 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073d668e9c0502634cfbf2f614482e0b75c240e4ec2aa536086b5e81321e5156 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..562f00cfee3f71396e58591169122e91d25157eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a12eb231e20cf0ed477dd3bf1cfbb04ba2ef6f5538ff4beaa7e0873569e45ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19ecc998f3ff69d7adfe47c77a5b3d1df16df806 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73629a6df257468e6bfc7f95ac69954236e266f5460a017c695c130efbade4d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93f4a76c7b9cb5427b3cde05ce576ee21421ab4b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c356594631f16d02c1dadf48e5f6eff928ee323655d1ba1cc99139eaf8d8a0d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84b8c27d1a0cf696e76fde11780f9233372c5ba6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b3928f56c6423587bd4b722b63cef8b6e0cf21556ba52ec3101e627e66fb47c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c116196eb17413b694b663c490b90919240aa858 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6ef2d6e670ef1471a1a81b857ff43a49e227d4f68d9d5e8996980cfcb5af36a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff3aefdd399b0b5af935be19dbf1a0bba1ef56be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7514db73118c50cf7a856b721bf121e5d2ca431210035d1f268d4919cd06d3b6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06d7dcd0d8e5e8d179076f72c53b317a154b962a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a5839c96d4a87e5a81de673211c0a774581ff05e5b85b8e390ead8dfc80885c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a61ff567cb7df36a0f4b3b13e0f1b5599910913 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:962166e545951db38ef454762fc870cdaa67f50856793c818a875e41776554db +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccf760401fb3cacede3c5132aec1693ec991dbc2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee7644fa53586a5e381ce68ece7bb62a1f1fca675fa5484bc3c34a487b33113a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40004df28d156d504845b85eebd1e3ecc684f814 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b403cd23650948fe479d49234ba025d51b8e0444ec4a521ce01da620ab989e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8c1cbcfca1ddadc79e7bf4ddc2d194ffe0c6d89 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16111651c5cacddda332e24bc43a31f81fe1ed7141db03d65f8f9a59678d0229 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86bdfaa41a22aa072d63cbe85ebb31aced0eaa8a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d86fe6d0cb32c33aeebb65ab98660b280242b03a2d128a967f0b643a6237108d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c10923ebfbe7f0cd527e70802edb66e4ead1d9d6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe28da913f4625b774adebcd08bb74faedcea4b7708e6f7e7b3526e0668f5b6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cefae4c3aaf83c484ece3e1bc8f54879cbe3558 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24b37a71039ca4c2c968078bf56e123ed8479f654eacd631bf4e883b45288a59 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d215d5734f0e5534ab4e5e3775f92a952933c25 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a067ff9e789ce78caf0ceafff54475085d479eff66eea985c204b3cae5dc477f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c966a12d22a7c4de66b522845b7fa3223d218b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1da4451b537f56538840f57b7096329f06ba793ff6e30487fba7d8367b3e10d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ce50f3c203853a5610e554eafc9de7bc4b1ad13 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99548ad3e372e4937ec5fd110a05e83493eeacd1de01421b74ebe42c86927ce1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e78641353b8f513a9af72a72f6fea906da5f81cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054cf8a1e28f847e4558b3f3aa6067b9e453f1e6aab63deb9480c08cef3b52c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b9d902c66c14b8f39e0fb1f1ff6a14800d09311 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:571f948b597a21ebdce97f9588f72c22ab71560bbb65cc5e88ba9e1d519fab9b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05b52270628da003acb49fff6211b943f651b750 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b295a26b4320f986cc5cee41eaba0ae0deb5a6e88646651ceada90bf9a7ee5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7122816a20ec3fcc3e6c92997353ca2bc7306d65 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9cd8096eef4628ce5d3548701c22ce77accaa9bed61d854ce9c7829e830fba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f0d1803c4547455be5b219f11ca26e88353b496 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af5fdb65d6ab1674044363c2dc2b3f27908f0e1467fa6b8fe0444928deecbb5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df72dc1fd1894221dd01f92fad11b9497d8e2530 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b2bcf56b3d9623caa3467af953445841049ce82d01132dbd0c039d08d58c893 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49d630fd5b3fecb8419592d62d852397cb1fab33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d18bad460cf2c46b4a5b966d9e639ca81c644fab19a098dce085f6e890ae2b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b3553bae1d0c5902a4fca7c5a12aade9c92baa5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:314475342c6eb92c494f47766893fa8f1ee57d90af2482390e142afffc01ae74 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7dedfff13cbcfacc1fa9a97e7cc9bb6ef664285 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f21665676a8abe78390ca059221db5a010014817394e5a0d8ac574d30f11338 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fb48690063ab7843e383909ce7c750be4e42de0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916ee87deeb3f61e0c8f62584be2b7431fe86738cb02269b65a3558b9dcd9fd7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4e650a4d662535fb88293a629afd50297df5dfd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:507a0b0d6d74641a542d6ed7e747eb41a530b188f170909e7183ba5ccad75a41 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cb495b81576dbc23e6ebbb63ff8726f1dbb738b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96522187fcedd716d0ce998a2d5b5a51782ddaac996e04c11d62035809314e95 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68b0dd9a997f6b415711e8d9657dc661b4784e20 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcdfcb66de2e9206103fcc5de57888232308c95fbb36bf4894a9325079670b74 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f634f9f6722f40f06bdc0984cc7187d80e669a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d16e64688c1439d4317fe4cb7ccec245bf26b2dcb7220e701850f027e5b715 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8ca76254ddafa6aeb2152ad84d5e6725cb30f42 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a09c4499a9540ebb9249a08d88ab49a3e0fb169a697811abad6f80197b2ad392 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2f440ce427f6982b7a6dbe0c21e04912762a4a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ab92266646801ba08e987a6414990a16327f8d90a37afeafbf360500abfda1b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c8b05850e396e5f9348bd6aa0bc29506868ebfc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52147eb43de85a7dbc9d4f94b863920951f74903d72e8eb53ae12cf2d6b248fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b43ca9631c116868598e4360f72791f7fcc1c8d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dbad29d00bc0098a07583cf02809743b697cdbf4790ce4cef5cba83059819f5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e4aa999bc36a85b8af223e8709eb509ec10815b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3410bd01f85652e2cc442f66a4f2001980cc0b2fe5db3a30dd74845f2e1bd20b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e55fc5ba58d39f6bb455e4cd5084ed466d214248 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303b961a62d70b92dbd056c312a6ff8a66505a19deb3672ea78b0864871a5241 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cbd8cd800326f14fff8586cbb517192a04bfbd9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5129263fbe82d8acaedbd0c2812514bd65a4afe321e5933d9e5171af11c9da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..350d3905e4e0eac010a63350ad6843380c38b994 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91525f95456b16c8db8e2d0b6806a6115dc982da834b4e0b6db1a0ec77998d17 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eeed2b9d3156b496050d500480fd8135641ef42 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f95cbd621be1ec0a753780363f6d9ea2f6c42931b7090d1b3add406ab00f072 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67c1a8eabe7c79ea93ba72692b8212e1558dc48b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c964e40f18f75d7ed32d62ffc8521cd38f5888d23d3db0af4a5dda92cb221e3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce901020b751e74495f8ef885225c6680f4238eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e885397a844820d7f56dc7c0835a27ab3ea152d8d47fdd1cc8b7522d842c20e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca0e16b20a888d050522a4033eaf58f22dcf3bf1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bdd2b7db0d8478e14b9d04664ad676b14ef72929a6ab8a03023b2ff6b37bfd4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c6ea8c8bbe2dfd670c4e01882ef4b987e1f1809 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8124ccf867b91a41dc696a62927a3f8c1e81aaca33da503c3c9bdcc939595c9e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ee4d81e2fee800528ec27246412830577c969d9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb6432eef8e7c7f0e4e2df128e3ab69fd3337ea5adc6daaf456483197a7ca3d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9b1c39118f58b9333744f06d0e84f6eab440b77 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ec8437e187e1881051828015c307ae964a089753ecb8e640939aa8c705512f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c97f3f1cc04b61872779cdb8f0de18d8663ae2e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfd580fa83fe81ceb3dd86a6c2e632dee487f4b28d6de02ce3effc8dc2705fc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d6d708caf2571aa1172b92472fdd3bd4b3474e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2277ed349ff8cdd6e0dbe0f6368bf4d83b6e865376e7e8f07df6370ee056ffc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c50557eabb9fc6b4ece596502115dd6010ddd87 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5425738164515f3922dcbede7e9e96c9ffba1441773f18bd78eec2f65b10eae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c16ca34edd56502ca38da65ef646d7e6c212ea40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee957515b00739b39ee127e03d2adb744f19ba06f0c05f03a7f3056ee044d7b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..94a8c6d4fb46fb55bab80e747c9b9a28c3c4bf93 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a024f5a6c71d82e5e081e7099061fe816298e6e1e654a85f54ba994e317002ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..814f75efb2edf0f604c6a69aeed36d4fa4571c2d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53bf2f15a61b264ecbcb8815e02877cc28e79e941c8da0aa11b399255889df5d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..095a41351437924b00d7fe4ae9863d734407d1c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a800a48c0b133d3cfe134750f706cca9bbbc009c5b448a813d1f6e06ecad0a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16dac614027466d3924cef162593b77a48e68471 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cae16cc59ba086adf13f24f51a47e5fd206f98e54d87322531d42f6c84c4d738 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23201e05dc7cd73851504055047ea5b260f1ced5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a08d4784bda3348baf20559e686e7911603c649658fccd3bd8694fe43195ce1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaf87c7c0eec47ecf7a723af2fc8a00c4082af7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ce471bc7caa183db0f238a1eac2d089963b760860927977562a5152075260b9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c808a4876c9e0b64bbdbdfb427c76abdf440620 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7efe4ababadeb2602b3ad10d8bfc8815a01cb8ffd1e609b578a9237b932715d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e73139b33319bb062d9a1ad70b41e9ddb16ef2bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69af979b9979fde96be57c0edc7df9f70f62323726d42a58bda15229b0666a52 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b7e5d81448414a03fcc39b946ead0bd8d20f04b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08437e79b422b1dcedc24e82ed04dd8547583dc32fd24eb9c4f07c042559e216 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a347513310ea9195c1c1753e9a56c2013075ddf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bf783fe6ebf52e1af4b6c3ccd0fb0009e585541ac32a3611b0f69faa00e0666 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8a03863d5b4438871c25959971034c90b91d76a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:216fe7b366df57fc3c512ebfaed63cf28118f9f72c98de6b1bbf21c258fa3d4d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0ec8012e2ed144895fdcc78c652965ac9192a0f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:362a9c3becfa24a62ad1f789328b0b694eec2c4c94d53bc1f8ef63311f57ec86 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f49c29ac7f095e31633e2de71f37ec59325eb4cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af83f6ea147a6273dea698bdea61daa14d9b415f16e442fd0e1434a155b0125 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52f63d691814e9bb72ed1471e909a252804760cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f33f48a854c048a820c3c41e9336a353cf437cdd4d687e74552eadc4d91c05e3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..66674a9b3525f2a010fd8effb0ffc8e6deb76eb6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ed84ee64c7da1eb8beb46181c6343d4d691c9b6558250545a18208422a534b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48fbec0fd78d55352d26136178ef7696155d8e7c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae388abe61baba7fe8067087074cc1c65040279397d86b5d97e8254e9fafeea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d55a71bd3f9ead160a0b29a98e1d0cf8e13147d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c424b79464bebe8191cbdaf8713d431863af007a875b18a88877984a25bda5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14bd0abe48253ece8fd8aa05450bc433e1e564c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b52d37520d4e424cb1c999d5ba49f7a5d07d8b70b6af777e06bcafa0f84becf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..537bdcb7bdb58e0fba4b351be0ae9380802aa7e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7d81af4a474e3607cf74de6726d9fef895b27c172a26308bc721427d6233527 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ff236988b07665512114fac936ed6d69acfaa5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910604edb37451c715b2feebc4f1ada8aaf7a7f012d57771dd4568e214c935d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebbf1b02d2a26303a09c02493eb595bc0b3c5080 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6f8ff1960f83873c657c807a8d4ba6f2e6a78346aecb5a676955baac1229d6e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9fa12439bce23c24dc367e50e4927bdc8488c4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf37224333921e9123ed98bcb5ba3bd6a5682976b2296c0c47c6486a2189b2ff +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba320d4f3f18ab1387225ab3a0bf8d7c83bb9704 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e4ebce3e627067c082c9a692c44aa72e1c6f34f08e98df72099c5ed60b23156 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10e6c84f33f004b937f8ebea56a997a595f87d73 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dded7eafe59f1ec7bb210b834b52d3215cc9a2d40874f900b6633bdfe2b6ec7e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28daf9cc8196bed5614fef5e5dd3659dce42499b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba5786c023ea9354cf3b0128cf618b9f3272aba817f15b168ee3df6dc1c9e227 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6546b50789efeb0dfea56317204e08144b29a031 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ca46c67f71ee4b742500723bd1bd4d0de668eb5620de2b52b97df0e90eec4b5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85378f7cb72d5b0926e2cec9a9176d6923f2d40f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0a292ebc10ee68cd8bfceab2e1de9d83d0d09c9d73db3479279f9169242cadd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b75911e89ae01f71f89455fec61b6f03b3db6bfb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbc75ac4f8b5d4ec37258bd3b122112e073922edf07aee87b4f8e076642ab350 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbee1b0bc61eec4de970b831400089cae9ad4d78 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e0dbb9e12e33ae643de23131caac9e8d50c53a8414fa14050d421e1a2359c0f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dc3c289c8d671ae3863e8135ccc91905674e11c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fe156e3a0cd492bfd764dc47a22caab30b2b95faf1fe0d42f87167a839d7b8a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ee52c89ec0d6eb5841058a8417d6b071c2d07d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b46bfe66761e7e329b220263e25ee91d6f24d3a5ccc07c9af9ebadce9bad67ef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0062cb456e7e9437849b53302854ba30615f5025 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d2613371a87f249df823d9707fdb67d21dfe96199617e7714f6c5019fae5deb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b315644d8a7cf74c2c1a2692f515b09b5b5a42c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0e5c8360dd800d24c9d59bb7ef0440a9dd95b136eef4e5325a57fd077281eff +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbfbce933212845abe7e487fce5196668303d9ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590c8c309580e26bf12c3ef2ff96f661041050d43ba616f39f2f9f19bb640fbf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db1fd7f2b520ca185bb1c85cc3da448a58725ce4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:341bc2a38fb30b6ea6cafc7a8838d936c7f804c9190eea9d0192022f45712f57 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1de1ee50a068401892406832acdce19cd1c17ed3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e0354fc9a5d6ad552b91db73bf13b028e357f637ade665de204d117258a58c9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eab5d010382075120334e65fb32211f186633852 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d47a910be4bbe5a9c52570a7da0010e0f6fa33930617d89c41fe3b82bc5236 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c7deae13f059b5f6aefef7f3148d7bc9d63f9ef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8857af81844501d728d3b08e11f970ca01b30f587574580b7c16b263b2c77152 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78a82db57b3df8c85c348c38d1918e8e903cd2ef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d4d2c01c1c4a7962f4aa1051633fe4b75de9b892fbb038a9944428a2a5092b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bbcf06426358e379fac1d054a005e6c2916094a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d81f2dd45441df4a27f00f9ccc0deed8a3a43c8eb7c2b5d7b4b79110929b725d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6672dac7f68aa8a595f4e4e41249c35840c07e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a4eb191f194042023a05628845c59691e380a080e19182ffaf7f743a9770327 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6051403ddae6de25b44a56c1852f878ca6d1f9e9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f15e6266f8d1938030298ed2f6d977f0754556c6c611abc43f278cb181427eb1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f52bf01dee9fa01a67d9e44c2eec62cecfd2c375 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cab6240de432e0b4b75ca9b860f88cb50e3c048cbef7e5430341f3f9c3e4ab5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94748f0ce3194378315a3392c831d428295f7432 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:884543979b7340ccfc24c97dde9d084dbb5d18d6379dc35f0691875ea37348a1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be85e04ced481162b04784edeb5a67038a97b62d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa60632e104984859a108df6c813facc89087233e7f5cd9e0cfe154acc2343e8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64c33f2e0c8161ae3ca2d5e99956fbb21e8d7eaf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a15222bff15dacc562050cdeecb8515b55a2a20ac836101aa9f27f5c6a2d41 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0482ac5146a5c02ac8696d7f44aae48d61cd1be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d510295fa167097f3c0a7c875e6cf2ffdb1ec789ec0c4304c43f605f45e03502 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..510b57572776233e221e62ed146a16a4232f2bb4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0811e4ed4e126d1b191619e378eb5118f6add198dcd77da680092d32a25e12d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f5efd997ac9ba2ce88f977341669fade1b46f63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bd2751fab66ecb2d100e7762c46b6c473c99eb563a2cedac6f7e051ab769262 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd74b445673052410992607954913ca582bffe83 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:714036b667105b638eaaed495070fdd1c94d55cebd03658af702e109fd4d6865 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8bfb8a8212b097016c88357158bad48a9fc5545 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c87278cb5b78681fa820e8b94de467960d10405838073125cff8f191ce6cc3b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ade60da6a1faa641d99372ad6c686785b76eb2ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:792ffdfe1e3b4308900967f52b63b766eb89853571a725781ac7aac8f35aa971 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9426133e85bd13eafa8e6aa8e4f30b1886c9f8f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c2def0ceee4367bd029ff2ea0c4a379b733ab88f529a4f49533e1acdfe55fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6bbdd20e98d335b1f121ed1c5b9f821a1af4704 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b9075e55307636575370fbd41d2545bfece85158fb467f41ba98bf3364c5191 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4afcebb6efe601efaf09549587e89e858cf092cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f4ca4eadf244a24d7908ed8438863a848db16fef1dccc1abb9284d4bfce081a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fca68337f97c1bba27b1a36494f34ca58a05ca6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e546dc026900194c2a4d75631cbcf4061cc69c86bf001ce7a25d3b81a2705639 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c476bb423c523caf7191163534e5f9cd14816843 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eda1670987185b0921a981f3e5d6ee4f474a39c20fc19e1dddfbbba4c3f7cb0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..461910577e1eb928a2506c9e44aaff4b514197cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7f6e0095df886739ffe75d154403cbcb57d6e9bfa22cd68f0a50aaee11b29d9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cccc552fd6b52ed9432381b82ed8fcdaa2b6079 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb4cc286d52bf12e748d83fea342af702c5c51648aeae2fe643c6045f8ddf84e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0f986dfea4b4691b40597e7aaef3e2533df5c8a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8331a0f38bfe57321280632d760f31f5728aefe2c5a1f22781b8aefb11a09d34 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d11d03c4fc565ad1a5e50e82a340436807d4482 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69628162613cc77db2bb475254505201eeae085e91f897d00a49fcc3356db239 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b672b0a1de0e45350a17b0efe26b3f027f01a1ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c907ce77ba5bf86dacdf8be5d86d33e5c9dbbf4f8161f7e06c14c8ed2d1762d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7ad2ba93126d131ac2fb657ba4224d4d21006d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368224e894acd707c9bf63693a0c727adda1de169148b5d3859b8c547a4e2d07 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19581c0c3fcc71a9a7b13354d9e405a871ebda4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16b6c443dedb5870e8dfe510ed8b3b3558adaaa0f77bb7f7ea1b38ef3544aae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0ffac5fa1e96ebf50d812e3b402ac8c640e12ef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa30a28f9ed920fa5dd278ddf63bac02276e784240b6d3969a1a56c6de02169f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55a92245363e52e14d8f265786adfbf18057d877 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7169c3dac8e7ef64482a186bf2dacd4600f72b1e5791da458226cf04e256998f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a717756d3aa4921eb23049f9473ede67a8e9356f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd5f9eb79bd099013551754e8a987752e412b48d62f3e1f5391c6cbabd2935c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e482b04fe3222483a11a8d87cc2f5afdde00a7a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:990d5baec9305ade83eafca0449d3eb1cbedaddb38c9ca8c8c3411c9ffcbdfbf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b658867fb29b0598a8a6f90fc084bec4740ef81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e03e1dbfc9516b7d0a5073def4ff07451908ed267c68b56364b9845352991898 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1528439e8b7d4ac5acb389845e40359c868f63be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57490142ae3f933000166962a39bb4853c302eb778efaf831ca76f179250c016 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c4dea107d495f66d0e24b00dcca400b9a3be19d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77e2da771b57a7ea903e1ded7d24c1e7e85cb2c7bfa0c6e50aba4b3e4a9c4b3f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49bf924df8541ac8227202e6719cf055a401d5e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7bb529b5b0faf7f912624277a6e8271b74e01f27317d5acf1d3298889512609 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7581ebdc1eeddda42068188967653bb226d24596 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f44beb530f228347319197b20e3da8c1a0cb4a1817d39987ed8350bec6aa24 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..856988952f5a99fe98b5b10069fc55b3109630c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9676f25b7ac6cc168d4df86313297c53ac7ace7a69fa69d6f76cd817682f33fe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9f575c8f05bd3931cac3bd60cb788f14d243865 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:965a7b0885977d4544a9ae42f7629de3b910a6bc0c5028b8b39703626f177a1b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb30d9e71c5bf50fd7fdd964f7cbe81593857493 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ab133c3b6604f10e3b76ae9ef55a1bd0ed32323d188b93417bc043c4b676c79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a966893e11aaa63388e25c399625d8431d1d8b11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:210a6b115d50cffff1f87b7996b857fa30247281a39b597113fa0abba14ffa17 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c4523db6efbcfe85220cd07a805663cc531a4b4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7e69660be4e2e83b5ed8d1fa7298608bd79403531d74dec32a0c7afab7280f0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad8f8e87e97e59ee55cfb2334b99d2e3ce3554a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ed9c1a27afbb821fad308bcfbca73c85bdd1de430e3a8c630308571129ea848 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc3ac9d630a07604270aaa9d0965063668ad397a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f07adabc9253fafed2335a6374e4587a19d85a2ededb2daf40d69897bf6ae4f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..896e7f64bb1135f337b1c9a741a07d4de6c4140c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4cc7c802e496180b2e9cbff855c21ac431293ba93c71cec37b89ce62aff6ae2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..014d9d5344a9a9ad65523ec2db966404b5ec093e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3902a9e1b22750838174629d31fa2cdfa633011ee810266a637beb875dfa752f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e25f0479cbfe5f70bcb743418bf41c76651adb87 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec0db28a3a0ef6503359885aeeab36f27a104793224d6a8b37e5c019a1d0d24d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb9ba7227bf0f541b49ae63db7408411cc5da042 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c594648f7a77a7c8aa64e27a4d76abf1085082faa0b889235be6ee6a6418222 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0d75eece30cc22ab17a44f05db606a8dc701fe6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bec86e9e8be75017f8ff96225dde561efdc7fa92313403ba2f1877993d7c937 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ede8561142e4e9da6df36b7e0cecbf1f70d4b97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11ed9b8ce0be43ff059d04368a09c634569bd7cce9b8d286e8a54da58b9c4861 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e824eee8f33e9465b16ac58aefab1da54226cf81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e45d96153231e8573ffb9d7e639d403d81ba5357d5ca1af2ee49f39be3fc5394 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9bd7f4f9721ff293f71eb109ad1d3f73c3cd928 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ae6d0819c45ac4f4453ec746c6cf595540943c7cfd7771071d675e936b9280 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebdcbc1179940ae2ab917363f7072311a2edafa5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:577f6af9701a62019d8678ea0b76e44a748841485dd8bb3f13a464d9e0395b07 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d566b406080b54c5820062893b2e154b0e040794 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8e5ef1cfe7464c8d5a9cfa4cdd2fcd8cd9b09c1f883037ffab4d86cc2d8c4d3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d69b4151312306eeaa38397c495b68f388c9bdcc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0057b47c4b52d9fb6138f5dd5562b46ca13b3cf117c86b77475907f5a2507a7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7b7ce5159dbe20e3c2d66f02997023848959154 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d45673627b2de2542416a452a1917d683ab081222aac8658b014d54defec6f79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11d8a2d8889dbf8d39c48d823f0a50f949a2c5dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b07d29cd952ddb480c17719ce1e87102482e1c853f469ae789463b17ea9dafb7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ac9a3166989aa5cab33f6ec9934600a2af10628 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6424ed0726b804a79faf88363b59c23b9c702f8765b4139b2127b58c248a1954 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdfe665767d2876d9969fb76a6a41e2f2477ee3b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7691ccb28f1ac9b62dffb187c8a4e08b8081c88e00d6cbdb8a1355e71e0668b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecfb18c7093a9f2f44bdd6481817f914e6f7e7d9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e14803049536a754f2fc00c5a66e55499fc65c6da7816a896db57fd1edf816db +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf0cbbef14336e07362d06b682a58efcffcc0f72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:133fdcaf294eb729544cb8e33812f6a9af4c0662dab84c56915ce949a4583cfe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce0b17c94ff0d0f68780044f34aec5e0ac87d7e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be833d2b61e24143e41e7b4f6d5049e5a69ce5f3858142cb88a34dcd4e1a2065 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc307a01a5b701d5af21a6210da6b6aa783ca59b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3736829309617a1f050b5ac858354abdb3a4e51ba562cbab6f42bf0f0553814e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25318b849021977ed4c0a1013454c7e901fb3ba4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d4eeaeeb6f8b8426c77a7545ba4d6b31be0c29360d2eeab3f452a4a761f501e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89a2821b8118bfba5fb530c5b6a8ea74d8fddeab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52caf2d6b75a90a1651d1ccf660d3ab5a0c14e0b610e760d90d3734f3c5fde1c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..722bb650d16c7c49bcc9d2cdfece9eddb7989637 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e26206800a4931a9927c33fd3def47b83a418da90b8347e41f96d608512eda4c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a1e3dd110cd59d668b687b1bd151bd804934116 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b62e1a20ae22a2fe2c5364e1fc87728ca97db3ed2b51bd3e97eb1f46fc4e00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c660fa75f8ffdab82b49e472f241a14cb158d014 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65da0b6d283cb1454cd451202646edaac48d65b33015dcfc0ecd561d96d6a243 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cc070e65261b55efb08461b04f6582ae38f43dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58822f2aa7232a37dbc16ec5453d7f380b3e7c877c64fb0a70037d7f50b254a9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29a2d762c5e014c038fca94639409cd932366bf4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83102b64fbbf0585844b6690dd83f6958d7fce8f9e2dbe848dc4a2a3b0f9718d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b3d9f453f7c875073e787ebafdb9681dfcae08c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7756d0f18fd2fa25f139359dc4980b5d4ff5540bf7268fddda57c7184a1dd7d6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4a52b9f9f23653cc4182d8384033cd0750ac527 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:606667aa6eb74458e3cc8e122077ad4725c4c58a19b754f2353d968a5e13001c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7728c33607f6ec485cc72e30337c92514775ca3a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a8d4143554a8cbb30f8e6ccc232310cd427e2b9bdf184cb95fade6820ca7c9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e409467c080f475e3624b2a9b833f923e6e41e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f6c491216d873f1afbabba8fe7ebac7b8f2ddfc07b4627ea7c9e437a12abf49 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c683f579e63f72c74979be568f2cb9d38c8cc4dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e68b165345b33ad79d1cc5aaec633dba589411fae09051b77ea8b7ad33e09ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1aeab55ecfe423033d72cc9b4b2de6afbcbad7e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4797ce1e5f6036c280e280990cf5af3e47009d55074daafc859350c7e9de4dbc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2572ea468d578d280a6ef5b6feea376e5c49e86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b0511ee5503efcf462735ae836cfbba5b63b3fb6c4b28e7f1fd2302154a5a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fe15ef31316a2f6aa3f477885f797df6bb2ccde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:615251326e78ee0984cc3c490db031d1a9782ab5fb6e85f9cbd1a5808333c85b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30d05c2b43ffd07268881bb2d024dad607bacae3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b1f05a1a308686873a6ed2417dbdc2169a6f1c925d56de44693455246a1a63c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50c8633cf16034f5e7cda7e934f6dffcd387ad7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30fa6b4aae1a56e4a92b37175c61060ce5a66922984e87086959bbe74a345bf4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9071c03588aab181166e50b2d94a370f4deac205 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec85ca58eb80349c8b15f5966584ff4e14a57ee1303981ff131f9bfd954b5712 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c8522cced9f35b6585b43baa709df4a63056c56 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc867627daaa865e319bcb826d31967bbb93c106dfe1779401257491a3f72e3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b311db9eeffc5980ffc4db08e25cb3171c7dfc0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf15fb08b54a6ef79c85253308792f5d8ba9505b87e90108db466bb67b469b11 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45ef88f1ace28e8f51d70e39a279fedd98ab70dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:253e1ba94e5fc77944eb841ee03202031f89f602f6be89a2152f34f4bdf33c9b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28deceb8fd674f47b1e53957a943ba968c5a2c90 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf67aa1e43424942e4eefcdab9c1198f698925e5941e1041e922cc098824b8e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b270774bb32ba6eb9c40519035ab516a8064352 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b8d12af9ae63c68354a28d2ea15eabbcbf1dd6784b4033960d5f3c4ecbe64e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0afc2da3d36dfaa8a1d708e7b0624b377da8c8a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4e1711d9aca1fe2923a56b6c0411ebad55ffc1a4e03438c1a932e6ad4eff1f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15017126603eb181612924f6f0d608ea449cd7a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e50e11ed512c3b5c14b91e8d5560dc8bb19aca3bc6dc9a15ff9be77fc2da867 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70e8cd4cc2f8e74f95dff2317d398bfac8e66112 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4a3d71ba364e4613df2cdce69bfc6f789249cbbd1deaf1c04ce83a4b1e51438 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a961276d490239c2a795e72e7ca0109cd998a40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e3b73d8520dab051212c2f37a6a5f7463f469b110bd20f07a21c88860d5826c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d26aba2c7fe257afded904e1c8d5ec7f1d08b0f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b01f5043d96cb5fcfbedd4e9c16183261be30e3ed76b0564dbea518319ba7a7c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d9cd753b04cc26fdc4e90326b0c9f6f803d1620 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eac78736dbee437016b638b4097d93d4c92e8c657db149ad8bed7b676621d99 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..552947187b42ad933fa9ceb95726d9074a5bfc9e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f26639649064e53f441c59b8bca32f94ac4f118df26406de9cce898b0fdf87 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f74704fdfd0c1525e6516f4ceaa5c66b3fd9be5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea7c7d2fdd16f5a360e7b73f3e7db5329b0c1b43fca220c83ac5a3476c95332f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e9e3e1653f519c2fef2bfbcba6e51490ba1c80e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:196bf4d4113cb492d49442627615b9e664a7deaad713934b3f1022aaa2c00725 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0e08a24fd4054736efcf13f559ec2e035d99800 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec5a460d8e316d35cf9f2a46aa64b37f6e0f2aedfee8f55509452ebb9677be0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7f5a5074c6a4bf45100603c47d3b53eafd0f71d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2905cc484e55e840f9314a36b2eae63ff8ef2eac29680c8ab8808cda8b1331ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3033d960a2bae01af30fd5c94554eaa5d69571dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24190e347a88a2c5b39e9bda8cfda808243326e2afdb2138cddd83898da3adda +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..499670e6ce79ea20d2a7e101044aabc2c6aa8655 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:950175c7361d70fd7fa7894957e105791fbec1ebb899d84e3bd05ddb16c5469d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eeb69df1bec05db083572cb3cab75b947c01c50 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c401a4bf9cb41b004880285d06601b4517bfd837be77df04ac1fcef9f37eb65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd4e331b156084db55510c1f6a112040da422452 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce8688a99217718702b2937576075f7e580c01da6a4ef9ab7ef6b9b16767a68a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40097f9c39a5f45dbd2faea3776ecdf79b3558a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da5937d1030a5ccb4910543b9a99630df3d7b52cf804dee66de1289499479f32 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39da1dedf718970f25c886dd7795e0978206712a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c717171ba54dcc84dc730a1fed61b80533eaf38359ae941c3caef45be004b4a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddd1e9289a980feec0e082133490c28305717d47 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc75844d8d00b8c9e41fb81bfc22964a7f90c15f3e3c6f25cef9aa7bbda94e86 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b38fbbbc7a69811ebef887535c8cdf2bba27db71 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3213dea7e5d67131fd79765d238219e32328a3d852bc3ec4d62686bbc5a5b866 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5585e326e5aab5c24e82965d6d096a77f277435 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aad19d5c718b4699ca86e3537272fb1eeaebe2a545bbcb5efb069805180f810 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f6a6c0d760712f170f8fb90de1702bc5eb1bd58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c46857db231b382190e5adaff61ce711ae856d73491b0053909e66fa6c9e0e8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..094d9ffed145b615d1618713c30f8cb8e99f3424 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d45d213897678a80111b99bed6200ca41dd7e0be0472bc497ddebedb10386a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c8be1e68985dfb88fe8cfaec669b878713477f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c99fb28d8c86721fc9aec83496cbe746644bc0b29a8527f0e398fb840142b11 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8871e34b52efc4d5eae05f4b7827e7a8fa9a8b11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b2a3ca477271275bee1e6b2a2961490a3ac6245d517990210dd6a35e088f023 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02391d6ad83f0a3774d0d7b55380a2346cb60628 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eba747fc6cfef3d1d76c4e480773e457b4502e8658171994556222516c237b6d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6aa1f02cd86ffb1f582446a323abf51d82e9e7e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:624fa5375d55d035a82ff41e69091fe5d22001e973b09a3f34fffc1e81bd7d2c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a70207ca20783b1bb45bae22d5421b8f5f961e77 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8295080d7b613efa1ce3435d4757a80c76d1266b30ad5c59f9871d19b7754a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3280429d3507d9dae56d90c75bf56cafa43de160 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cae1d065c3f51005d284da8189be1fdbb750951acc629213a5b2c4dac8fba340 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e76a910a51f43d541a3ddb7cb4091de172dbaaf7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8499a3a4da973a4f1305d71c01e97589fa120f0221b18771f6e9f52b0119f4f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20058bdabab0728973ad208d172cf1cf56722b6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f871f3c2cbd5145236fe96618ab8cd2f763bbd0a53e09504439bbd42a5b5098 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6a123e64630256dacbbaba618726b674932655d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c14074f0a3c283795508d4a6c212d39abc85fd79f395fefc6d04e6b8e4126b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d480a494b548724a53b96f7f4b9a38e2854735 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8706cc0c992ff5c9e13ab16ed4849a8c82f734ee1058a5793da0239ba93380f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..acdd6d338913066a06dec40c71240dadf9838bac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3007ecc82dd1ee0e9be56de2c5474d93f64ccc55c5ef8a2e99c8008240745075 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12c4665efee8c2699c06beec3fb948890556441c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f92faecf5b61d376b1b855974717962db7d4cd7622127aca40b055834112aced +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9555cf2865194641b65e0c1a853fd550a8991d39 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98403a3eedff799fef66a64c32e2e2f50b800a5a3754e74af619ba57b699ed1d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b25dfc4b56538b2d49de45559581489063000dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0882a5b8c763be51a264177395ec6a876d25a16e4229cd1a713fb22549f2728 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1545f2972e541b0a2951b0062af23db64c99545a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c123f58224a7016c69f5e600e9fc56d3c4e45b495b1ad1d50573a35b63c450c1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08aea09060d2e3633707f860a287960286a91507 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2882dbd93f0c0547afe32231703155823432c02bafbbfe9ff2eee67498b62f84 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe240bd5b36189d7f843e2a494d3a6f1f2a94f6f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b23043d736aca5efcfd1308f834f49df2d2cd4aa09e7fe6df767333a8b262adc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1c5f4d45695e974bfd3f08e40768d747b1db1b0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:328140668864f7a116e3c20b8bc016e4d0ee208bfda0a41861fd27efcdfbc747 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..181dc7d93251c5268d11dbcf5e23fa840496bcee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c66e9b54fb738a71096bec3d5887ab985e34f1da96b4d3e2bdc8c32b71cf701d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71849c048f23f6925900644d8c148a8894a963fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bc60a5eb35008301ae5448b5518ff74eabb3ed7213eaa56f00a5762b34198ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0d91c4140f8bd7b2844a18ed26b6e24859eeca4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d09fa567bc6645da843cb7a77943a51615aee6cce258e8bea78780770127782e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a3e56c3cfe474546a4ace6d46cd28b266b95cff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ae62681a0dc552ab1ca1c2954679526912e0a501f4dc377257e35ecb5027d16 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77c3b087791fff6830cdb4e6e333daecbedf4052 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae93fbadf3ae13046e66b0379754d84a03d358f9c60426a4a38b81e1acd626e7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1e2a40a043dbf61949ab1b100650dcb8e22e91c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de415b0e8da66ce7fc2444d348f8deebdbc40e71863797eb5abb5a3372959257 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32992fd8fbc9364eb95a16d76c83d19c2447361b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f47245a67452b6ee1fb3e1025103089c024befa716497333b2528018d77c9d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54976e1685e4810741ae2fc81bb76c1deed06000 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e867f58be8e7740979fcfe68cb0945e13f7b7a6803fa178210c217b10717ce4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a900505515dc5b96e15696f1be360f8350b4e6be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e52b5a347b8a799da05a3bdb2ce060d981731df3148468bbfbf9015c76320840 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a066afc1956afbb5d71e1c965fc09156c34b136d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:097ec861236b231feaa79cce62d420601e3311a23e53425234f4be8b32b7f221 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00fc9add3e697ac3e20ed58f5f3c9a05f2cf259f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6438c585956a3d2d02c35fce19a1d434fad467785fd5dc3a777d46a53d196a35 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0515de9c5a1d278721e3f049f24943da271741ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a926e3d7b21939552c789d238c0641bf50ed5389e61e540457d0f90c5e989d82 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b56be9200706c09d929ce39a26e0582e6422bc6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ef1872ebde5a91c9a4c9d9b493af591b43d84a32a9c759de3182838f07bc473 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb8f1fd896a882d969203f0902eb4304db4d2fe6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7888636c38bf78438df29ccbcfef6976b089df2f73f58a0eb585bc6336faa40 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e27d6b7a724180b2848dbcdab694400aee5301da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:708bb1c80f56b579fc32b5c3151ba91defbeb9b32d4265d38321143dc5b87f59 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8acb13d5bc50c0b1c0bf2c34d209d28fbd281ab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ea5cf2c1c15e690d30f84bae94c3a76cf12706c1c837428320285e799ba569 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e2bf3284e606e406f183275642e95a647928409 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:def504d2c565f38653e5a05859a83bbf95ec6fa3698f5ba15a7da2c78a32063b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d19abef369d4285294fdac7cb335093313213ecf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:070c21b995538913d1441382520e8878013026f1c115a18bdcdc41743fe845f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f6af9e4ada3486097fe8b0338169c1db2c87ecb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7279888e6136d72ba94ee8cef6bb6576147b5038a4b7a6632b70564915e7823 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5278cf81bec3c21871f19e37d545d4ffd853dc18 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab3e7b446c1dcb05ac5c6efea90ceef7a88b1e0e05a59809cd05d3ee27b48899 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f55f7d72f3cfeec72bfa2e9ea23426b8c3ce08f8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25964b64a797d384eb0a23801d9efe55091157d8c18a039892fcd4748cb9349b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebd86c041e8969dbc51baf463eabf48e8e819e6f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a758764c98815de4f48df91512032761495fd3389544a6b3031b435cf0936d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38bfd369eab9b211724091649f2557d58469b530 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede7546415df2d2e4b7996328b6eb338b5b5c220414e357de705739a63d88d69 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e00f1503265fa92a9b6472a017d1fe44cb75ce2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a9b4c9506652f00c97905de2a3e99719e8b2d06f1fc4ab7381bbac3793775b1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2decaecbb908ec35d8f2dc93106ff902c6c5d2d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3177c7e9a3111e17a6634d0b55406c68e949da1f9b2590c7e36ce10208b64b65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7baea18afd05b6721e200906c0771b17981a28d6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9fa20d9562a7adedc4ea8a260dd58a00382680248599809d88fabdcfd2cb06d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03078ab3883db7a07419d07780109a9a69b75efa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f543688a6cb7bbc14897bc780b3dd3f27fa5ee30af26a2518fb9ef9ad6ae3c95 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fea3a984590ae684ac0fc09eb55addab5729d078 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05c60bcceba111b76ffd39add28df23536aef58900fc8ab734db0d26eef64826 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfee17564d539c66da53de9e1b0458a15315d1a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6e4aa01295fc5fc0126cf563ece4dc2ab185d3f21fd32ac43cd6e11532815d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89c3aa013614d29ef0404482a8aa0209da001a49 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc859e4cb628f82ecece58e4b7020cf14f1cf202cedfda547815c6d96636e835 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..846c8ed27c290250d6af647fae7ee9bb8ee7820b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f876aa5b98ffeb5c9e4b61ee5237474dc1d6f8099ad1d798428cf74ca445c4a5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26339768d4afd911050bd4b0bb78a1e3c2db7796 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1c11432091fd44f5d974298c59918751199f5d001ac51ad0eb056c0a9934c0a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..699e1378eca1be924a26c16e1c1c0df17454ad99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba003012b94a2e0618382ae1748fbf824b694307b1bead0b4d92cc760c13a508 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89eb6393780e1313086793bb5028ecec9d87cc12 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c87ff5ad55691504506e8761245c7e28b1d5e936439ea4bddc07a6081ba914f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9634b3396c63b41931deba8f0ce827e55174cfd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be573b562ed8b0133de5e1ee6a083bde6ff05e147ef1f8825d91f95db3f4e58f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b47fca00b5049a3374c4c6352c0aebd31e0d542 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27b931efdbf5d628a30d1e984b77e72e315ac44911295880408762f02022efa1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6713dcbe24488bafc60e52e7b532b69db7b2a026 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f00af94caa1cb09d21f62a14bbd04fdc4bd3809133c6e2acffb0d2bba90eba62 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ae0691674e38be950b500fa1b857eb9d7ccad88 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3d62f9403f0ac4c4ef860c6a6ae56efec5096ad9fe1f4eb042e57ad5ef9410 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd5065dbeab1ebe3bbc02fc1863577bc4b1319dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6768846417353ceb0c3d3aa223339b63c86182f2c336d695f4a3ea53ef4e62c2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a02a494de105e2ac61b4ae2d29401d2d24a40bfb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f211bd1139ff402a03596409e9f1e19751715f598b514a9b1704552a60600573 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c31967d9a6d57a63d7aece9321a4c92fa1d4f8fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:594396b7d7a6d7a313d1089cc0c517f882974bba5ac4fa7707931d3a6dd36182 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0ad3f81b09a9320a207947c920c9a14ceb731cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:744c10214d072c38e91b2bf20517ba0da87c3fc59370f36926f79866cda4ab7f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fb0f34d6567e97ef80a9bc9e30c2c858dcc0e36 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9d0ca1a7922ce0a8e295b76157af79c5254c56557996c49a58404ddc1731d08 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..776e23253bf7f16b1b9672e7bb7c4e38f2f33e6c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e344d6bfc6f58bda1be19ebaa04ebd066b85925c44ab6ef66ec46f39f67b26b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a94b1614fbfa598b9737bb28bc4fc6b3f23f3d35 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:914d8b082cbed8fe3c3a9079596c10a54574ce11a720cd59660ab3e83c511a7d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..43eb37e3d8af25c7f6fd4a898ea89167a72deaca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b83fb41d572998481fabec2eb94a1d0d23e4f058c89ff6fc015044c6c8559b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc9e90535fa65158eadb8c52f4dc5346aec7a5e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c87f9e2bfaa800ac4abb92fe1b0ae8b1fda3124a9d787d526cff20c9ced8b9ac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5bdf1ec4d6f45d3c7f70b07366b70ea6fd89c3a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4614c43d299241d658d7b08114d4d7747454f5c5e07b70942b574f17a0c30b1d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a55070b31b9d490b6c7a0ae23659681e8bd58287 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aaf729e8285406cd5c36699839d74b136c48ce3bb0a221ffeb39d594bdc3e3c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73017b89d98ea0f990ef8552c08927998e01847f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24e966f57746a75dc8cc69d74fe7c8bc13e582882a8fb03c8cc4c0b6ff7078ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3c74ddde1f37127da00bd0f1157b3bd8649cc2d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccecbe6693d525e98d6ce6e565ba441aa3b00c215396be1aefd56f1b8422c3ba +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5b85c994e038f883c623d855b5c6415856ebe1b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6ffc3612ea1fd3039c804418e73e3ce01f17db7f315109f84717a6dd21e6e83 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd423b4796bd9e201011612a971fac56a1694de7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e7c7ce6ba0a6186c314d495c04fe7736f8fd96c0a9b499eeee29b0c9731689d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a695a842ff013655cccb41c259b109f1b2070f18 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b69a78c904fe8b10c6f861c6fdd1dd009ca91d18acc34fc8161994c3193d9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb6de5ac6a0955b19461b13c6a5556d72f64c1e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd49218fac58609fc613acb8f1e2a791ff873b4d997afad3311dcd6f15f32aec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5159182195050f5c25c75bf1ba8e39b4e500cbf6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9889fd4c9638bc20ebde1620fe03d4e72bf177bf2d4be005f8aed19305f21e6d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed05b52653db376b2871ee96fdea9fbfc1259b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c80008a0fb3197355dcf62f92cac8d847cbd2dc8251986584a314a3b4b3ea83 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ae944a18b6dcc0b3928df909a2bb74543331dc2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:025d2f3db71304d260f9d368e3c5470e51f6bf154790a682b5da45b57d672607 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cab2254b4ce2a2c2e77a8aa797a8eccc5ad1bd3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3372f86e68fd3ce414dae71dbfe2c0c14a5b188e150049e4237487894e637fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e02625408a766326bb5e4753a347b07d29b7b6c5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea148bcc3cc746ccaf924f52d560b96a8a43e1508f59e81b974260f78dd3930 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad6f49e646a0ff0d434c72d0f81bdeb7b2b40a1a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd2d416bd965ee56ebac12145c26a1fdf7499ef38c09eb4a1532f90053ee57d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f1d03f49951e0c842fc0b7d35b156fcb46f8eca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:498ddde2c076ba7c08dca2be61d031a274919a3cb0a3701c41afb651f77409c9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dae16d0026e0f5dfdaaf6d6570de2bcc18ee02d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca89c098718ffb26a4251842e7c3669b38c8dab68e576124647be3b62755a917 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30c2a096c9120285265d0ca0e69bfb04ffa38853 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b0e6f598c87fdc9038fe40c1b9130cf8434e8cc262f2bbd68feea9b102fa20b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7b0581ceefa40df14f04386893911b73f00b70d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7e55fd1491a96289ee6cd2df3c1c74ca8c6348cf592fa6208200037eb05c7f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82a655e6da4be36bc2528e94dde2fbb2b6e5d3ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ed90f4c49f76f645f312d5076853fd9c08600d2cbbeb19440c82e96cc382d3b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48bba26c79878cb3df4b225aa5eae9983005b3e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69ed0b007e1423e8bd281693a3f76ffe6ad4463ba0a92805de7168c1373ea121 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92bc3388f3f1a065f469c175716878d72fda3bac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2b03086dfba360b8ebfa69e0325482aca3d2ef2347daccc314acba2fd6bcd5e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad4cf2e8360ceb483965ddce776f5f993fea8002 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3ff7ee002d3854814071057310e75783d6d7dc1e37c52ddb7347050e996c2d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..508bab1c1edd417a112a74f66361182e31c9d3bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca190420c76679775974546e2fe6cc190894f2e433fa48d7977eb7b1156d521 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a63fcd712ff2d146ea479ba2ddc95afc181229d5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be319320e15f3b8794b8c24ffe257951fae6c26692c53aacdb08c20738ae6760 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ddf2efe7b36e8a11a32599babe313bad9df064b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bc50003f67831533559de41ccf3246c37c3acf451c86de6309465491765b619 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..51ad2a33a046364d577629be8918204dacaaa3e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2228de401f883c6e796c50a1d323f6692c4eb9a04c4ccce44f3665705fa27ad6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1b6efb0a97ce49f38c69a6f5ddba311aaf7dcab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_7/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e24c27284e167110409a7c73f37c4c27172faa4896f5c61b190bbcfcf4025dd +size 11395