diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e09f5d5fe2000e8c89014cd19c97cd7cb130e751 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904758a154c98c640001f446d4c1090c3d467c6c0f2cf531137e85c98eb016d1 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25e9f1b3297c6e05bdabafa400a054ac173786b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a58194e28d6554db10edb6ff5e0f5537f1c4eb7fa9c9faada7e302ab91ac9c40 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f878581ce5ce8d5f76299354e08e0e481d9b9ca8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1381305e81de94ab396b27da4295667a403d16d85883135bd34d021e0c83f9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..506a53d471a005788ff7aa14cae6a24f8dfe48a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f416bc773be74ae9c440b8cb04f0aee2a6ad6670d946fe388c5322daa25c9f3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a60ac7d72081febbe10cfd2bb8ea601fdc3a692c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b5065cf306017afed3a60bea224899419fcb29eff9f5aa987ef204eb529589e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..288d48e428c59614a1eb896ba9039cd3f46a0ffa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c11cc15267c7049fb4385ea0e0d29aa8b749131ec34dcbd17840617e04050bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ef91e1259ac424af317f3cbd598b5fbb60d7bfe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e159ab50e181f0ac7af9682d8d39115a1f2171e783678dfa3bee2393528d447 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bcdf3d4267b6bb83f18abdfa318a27528df043f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c1dc0fdeab6de176966bcc6cd137a91c38c2c072fbf6914c6b7a64c06a178d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6268598cdc3c73463bc4092c3148c4ac69a2d268 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f34bb0dec05bdb2524555ff2aa5eafbbeb4b76d53de90b5783eee0f50786909d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..01a547c034e0be629dd88dabefd2fad0d7199ea2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f62bfec4833f3d5265fc174f6947c437d3e46950945734d4207c4b9910bbacba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90e64399052163ba5048a529d947998a627449b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cf1f1f7b5db34613dd59344bc2f6a418c9f8ee72bddbfef9313765e0911536b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ddfa5001b70c0acc666d1f065c37301e3083fa5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:145017d0622c6a6009b2c49402a7cb7c62fb06e97cc08bf58a7fddf27bf39e6e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..26fdf1bc4117e300da9531b8dea4c061e5fe9c28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e50671479105857ac64e90eb67406882446b96c2eb1c850b443fad64d40c7906 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb3377ab425c489824d3b99f41db65fe25f7e42a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2c955259ac4ee2a3e63fe898ffb6619141a83193e3f15d748b1010c826ad50a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d8b94c1874c5156d72fbbec6f0cb5eddd8b0ef7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d880633cea9780c4e812fc141b856f7bda15f5688fc700fa57815fff38e8b92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..249483b7b4ef3b6680c91c26378c27ecd88da002 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:703a50ab399b118977dcfd3973e9594df90e456ad7bbc520e7d3d56e76ccb570 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df6b9a788a95ba95859113e53c3ed597fde20622 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff472ebecd1d9252987005f3d7b5ff669f3b5696c8f8a06ef6159088f7174d4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10cc8d506a798f62a6fb01e6f303119b959fabc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2484cf56a27ed18e3e48bffd3910abc611ad959684f61fd59df0b2efdf4c8b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..214323c6d17322b319d97a851cb09ffdf601c703 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1e56262431eda3719185a252d8e868ca336a2b489301b18e44483ecc9aa467 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..926470c4782de062571cb8c53f5e0ec213268b6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:056e2a5cccc57414f20a22b8f9329b21e23cdca9ff1edc4995ddb6f72733ceec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..445b6a3c5c3000946d375765346fc905879d4128 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9d6d5297ce75214d6a2418a4f6ac449c842b64578c092665ac77b3510b184f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57108a77a61cbf6d2bd623d5742f1bd73605ae61 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ee999bfa9cebb18fb38d2564b3c41fd46644ab59361f6c0e007bef2baf8c2a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54a16b0a23853174e46d643a1b9e967135fdeb37 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7deb221504fc1b98a2a401237d29500aff2c8eea1b2cd5827de57c9680a42014 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53bbdf228a7ea2b724f1908507f15168ecd07803 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d2855c8e360729c825ed74dc9c8b09230f654d0b8e387e83a7b11879042a395 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1995723e4228cb300ec777df1b32b323f364ce66 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0487574ae995bf7b46f9bd88d2041ae0f09e6f459652d2bec8dd747ad1f1e05 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..179b7702bba95949953bc3047fd1787d868c66d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34380eca8bb0bb97fe2c0b1b19343d6fe169138ed9933f9bae883a47e80292d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2929e40d4c11a69ff90a4fa10b51c85449a70fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1496fe8fb9f1bee89f1a5605bd9798c09c3a685f00c6375bf8b844bc982c33b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb363a7065e607a2e4c29f5ad8afacc3466f50b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c28ee33ee31e72f4f19591228216044c78c8ac8ed0ecb5acfc621e16c0fcc7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f2e523c7c245bc9eeaa259419a190c0f9320b5e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651c02cd95e7958415a10fc9161f5b10db7007f923433122af0874ff549305ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0096b84dec9d59ba516d7a62942bd05dad55b08e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59743378391e00ba13f5b30aed88ddf0fcbd883e3f709551cca333564c6336ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..592804db564c109026b3376c436af6da96c3ae4b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca480b76df21e7f5f650efb1008fedc3328a0ca811a9dbc910677e0f294e0e13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86c756b3d14304b41375df01d2a5d59ca08a933d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7349deaf07f589690dc8964467efe8aad7c24836716b68f4410ece4d9c5512 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17378deb99a9a0ee3fab1019c2dfdfa7a44a9cdb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8ad16bcff3e99c12ff7188c998aa8ce60f309c52962fb3ae152b8d6663e3067 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9171252b4a6e12988386140aa71d4164a26b538f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a9d5bd9b9a07315f7b62274939c66dffc9cd0ef3239ab988911c862d644424d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..693e2dee13f7525c7b6701f1c86281b4d1dde436 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651b78fde3774d273576f1714a75c19758c9fa2f2257ebc326dbe59ad03ed4a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..527cfbac28a318bda0f936480b1e70b3aedd6d3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31c69408d1c2bb4d71a6826745b6e2953113cd3eedc1776d2840fc2aed8afcc5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8655c23598686aef2a0cad69f06c21cb87197ae3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8005d0a4715e4e11173f79922808f50608ceea52c1ee4f672f46d2653dcbf51e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5190b657e0544950bbdcf0e860318f93fc08eb75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da658271e5cc7ccd528cb0100907adf6237b3e4fc3a6934d13dcf0f1664a7cfe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dde69fe2d146a6955b3946c4843d5736c9fb5cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba62573eac08a5ee31d32ec5b1bcac227dabb4d6e559d08e73e57f73af1e0b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7635850882fe507399b44c9ca6195d796ad31b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a15e349caea4adf2668b19ad8f1b4dd889cea87f51b608514af8339e8e68d9b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f603cc7443dedbb08d39a18de54301aff0c41e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7959fe20a617b96fe5d11eb4fa5cf9697e51554198c644f8362fdebcdf73ab9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3e493b9830eb3268292f3b2c1d33660b4e090ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dfa44defe82435d46da031b78801389c3cad82e47146a8121160f42d157f9c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1c0ae7f8ce58bebecd7d344add94b8146d8afe0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e088da9350a6ffa04d45a931d0eb6db62c2e46980d3402cf2a199756052d2f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1930866eaa41a9eef4f9ddab30360ec219dfa16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d50c3b67d89e27b5610f97edcdb54877f1ca782715d62ae2d1c63d4a9380306 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e476e79cb5a8e37509525557facd2feb370dd0ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d8b0cd97a21a688f531b395baffb4a32920c1498d1bd2a68ecad1e35d085922 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..075f4cbb3bb682a634b1184c3f5220cee88405cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec14c240149fbf84de52c501e59d59e8a230fac089dc4e61ec0c6702c1191c09 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5bb71dbdf39c7ef07d93b63478ad9841cabf3fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51f8f16f840dd460e5836d29b44a556a21d41b624e24c87a5f66bdd4a67847e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3253ac9571f3bf7d0616cad54acef172956f5bd5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d75f862b12243baf05396b744f37ac0064a73f609e64300b16ee830993881fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55ca1a7a9ed63bd6d9d9bcec76738dbea2312207 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c91825def4382b5ac8677e642af8755c98e1ba27db7e8b10550a0e71b6dc8e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dc7eb2958f0adb50ce2bc13fac4e9391a609748 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409fe26a59af9007533c289f7d332051d10a99f52e8ac4223f4e99b47a9764ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6ed831628ceefb2c2637265aa64c5afd5029f60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a361d3408c032143fb8c76d3241c5d50c1f5db701938ebeb01e061b3e685655a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e3dfc70c8c3c73410e02ea214427eb64ba86a0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c726f3e818f2ef3de78a9fe06470c9db5e0b5c8dc33dc27ba339ab373ed7a718 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..663e3104774a1592bc3538cca9f16a2bf9e81ac6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:275913ef05467be7915bf0edbe9428fe800a7490b0b4065d44824fc272c86eca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a79c9f1fbe512e4d4360d100b597874edff7cc8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59691b768cf0c6abe800a021dbf7d5a61d292f0417c839c09c48da684410ce70 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7d031982c09e295847e30c67694f04998d1d0d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ae4f6dfbcb893e83bc0247fdba028937356e9bc4621f0948e27c1ec9fd64a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aaefb2073f0e22e394632b05ed705ee71fb7632 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:809926c8c088bbfb3f4690bcb838c5913eb3e67e9d3cbe2e96b66dac37ed7f3a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1324e70e8f8c8f1f52542733e517638b1e271198 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34bfed9879860a1e62179a4b90c9ad04757c9e55ea85a5da46412684ea0a495f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5895de3df648a7aa40e9f8163a3906369f3bfb58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb135b17786049ac65acf67d5fb56f9558e60944084bdf1ace129a3b735dd256 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bff0c0ff3de3187ab428de61836f404a2a232cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:467fa6b787d909113dc6e6dcadef60d29f9aeb5df5df70bfc70bbefec0341394 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..84a5287adc13746d70f563b48fcc81b2a17d028c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:604c2e6c62e7acca54f4d6c6726146f7e8be86d3f36777c6a627158a9eed41c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b12d6a8e9f908a1ca52bdb2d543eb84ab8fb2b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:326654ab615bae0ae9162e70e6de419d5dd92bf615b157687aa14fe7584d0ac5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f78e8ff257ddf81a7ba37d179834f6d0ca618b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c799a7d9e3ed62f9018742831c7d67b36b12d61fb65ccee5f644f5538b375d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44a1ca3479d7579732b92a0db7a1d3825e69fd9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e03cb9895ebf466c6dfddc39fb3df420620e48a15ccd9932c40e59c0ff4a3f87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30704dcc171250090d3a3723d93441cff8d1a23a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e321ed7fed2f70b5b6df87e2c683839b66772dbd2c5723f8f42d16df127749f3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b857cc0a74194e29ff3028f08ffb4281796d9e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:babf2369ad59476c8d4f662f079a32ef6fb5bf9c95341d08e1b5acfc7825506a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a934968cd704feb58e8af253941b8a7f43378f34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbcff0b8121f497937128251c86555049ce85db3a3dfd4aff35d520f14f5a3ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ca29aa86c972745855b9a76bdb1f768d991a872 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24229970cdfbefb5b13861f66320813aa21901b4d3200f5a97af867d8912b654 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89e8b63b83361f0d6c782a44e652586f79d88b85 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:637a8fc90d8b7a5b399ccad261f2082d36bc82ffb7622be6c24682936a1d6edc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8e66a3c202a2e8bed6fd7b847bd960fc63fee5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18a9b6c05446b04a12250007f17b08fbb5372350300c3357e05f3233cb7e206d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45a972fd73c6148468af6287184bef1c8471d57 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dea34e4e599eb5bb034e50559188d115eaf246cf576caab0d149eb116ce9c012 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5431bfd386201abc0232dc63be04c55ff0026df9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0c24462b5b6de4ee6ffb4902cbf254a64be1dda2312f29bd633cf8ce3d1605 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bad2b0cdb308abd501d39d7371448fda7630f6b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fc3f6c7d342d35a307f4ce70569c78368af63c261392597fd554c3b9f0bde5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..73e88ccab147e2cabf5d613a640593348d81cf2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b452d1e4b1fb29c699c7baa2c886a5522ccbbad52d9be7a856b8790ad13bf95c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2d7a6d2f13a45ff50ede47a9ecd0ca233611443 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70295e9e928a6738b3e8cb71b825d178701c96fca7e3ea306c6292611d325e73 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e714ff07d817ca7bab20048b23e241b9dcc93fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fda0f58df3f641a8f2046f6aedafdd115de5151aae730f2e4116cadb3be89c08 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f2a599f152e79cc73079a58086abce8ed7ea0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87eeb074cd255cd3881ff47f4d41f7b39ba52ed8c9c0154cb2def39cedc1bcb0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c47d0a6607524858597ecf51d5d4c9f405969f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4962d9ae24b942e8b52d01f77077c4dbb1238d7b66d19e402ec0c5d35b18be91 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27ae7224d56c642fb01c8e9173f5a6d9896f4164 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb149b82b0bb1ade5b4644ef74df5f6a80e03d86934c53602ef73be84b074a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..247aa5bef3735ee75b7997b099ddf732319d294f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8efe762cb7ab442cee2d36af31a8db0a5c980c2fecea3d306d3ae8b4754d9599 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4e4b999ebf320bf5657537e46445e0f4d3b04c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb4bc60b6332a8d803382efa4eee121ae4608a8d352ca3543c5efd04cdbf19d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c4609a830780ad8e8b810c0ac81e4bae6acb4da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6926eba6542817948ebd257e51b71c7fafe5dc31d6e28c3d3e83d246a95a4c58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a1817a2bc8a297d9617dc431987b754e865ce2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63d96f672cad63f06090610842354fe3b638e9941802e264ddfa667299e422c8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1122d2e10d76f1337c9e25612d3f8a842549a9d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:692292e754c2b054973a695d3dc6056265a7dda4aa69a88099409a8d50a525bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc16ae5bc6b9e04133de7cff6758be0345d7b400 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:549705e5c77b09b942915fff1a4c83f995fbc2ad882735862841d678a870277b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f7ec12397b1d453bf1085514f373769751250bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bec19418677be7106e81344ee1780a7da9a6201648ca88bef44aa8f4c549aed0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..785dabaf97624cf4cc1a87780a79eba12508b61f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1e20d91678f35d9ae580e6bc8ccb55ad3d6d85707185c753c17c7d55d65277 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac02bdbd624f7233ed4cb2dfd96b376e2f131bfe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e37b0b8b145c80f86a98cb5c9981dee4dac86ab97cf37ddb8289809dbbd79ccb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c7d7c8e5dab9ff86db1dfcaefb3d62c4d5e5e09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a36ecbeb805a953d01647f155dd0d1cd8368efff64354e02b42a99f08796636e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17ea5cd34191fe511853f72885e96acaa8f9ecea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a967d58ec00c6ecd8c622a03e2b4b6a56260aa3dbf4a92990ea0bccda6e543ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1612c141ad6089a90029853fc2f2f934c532b06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83dd6312c6ccb5cf5868a2b839e623663cf889df06ffdca012399041e9d9a8c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63c1373eebf365f7099cdcdee28b244a622cf998 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8111f3e4d6c2cf48ac4f45041e1a9b37756ce1b6aa71acd7cdd7df4efe7b92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48946001fc729348217a83bb50a03e37a342c059 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e32204f0738e3f2c73a424e6db059fcdbaf4218850b6b962dc3254fd5f9ebbe4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cc6ed394035037f82387f735df91e8b7df6031e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94dd438434ebae863d1121426cf5f81655e10ad8950bdd7215ebf9f851859cb1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd65d9de32dd353bdfb9ed2215c588b3abf54740 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443a2d30924e251ae8a83b93c7e9c37e7587a9475abfbb73836cd9a341e25985 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d172749c9c66e5cdcda8451555672197b18b5235 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4b3bfd36e76f039d9a5a2bf4358d89007b2631c8391cdf63dcf997d1fd2d6e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..19ea0a9e11d66d849d8fd34b735aa1d42c4c6df1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21380bca6566f78524424c0595b7626d08a1b0d7bc8b1392712a3bfbc98bbdfa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..114238ee54ee22769ca3b5b0c5800ef9233d2cec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e247e0be97cdc529a98e48231c09774de475a381a101b22fbb702a14897103 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2baf60ee73f831fd68412c4598cd9c7b31aa23d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd43eec8ce606b2978338a319112348277dccc8dabba6f9bdefb8473bf934263 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69d426498838ee3009771eb3e4563dc4708cc229 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c75612548640cc9772dcbe580208be49bcf0613f5c07cff0648f3b9cfb03720 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca99e56e33c277d102775384f35787ed2961c637 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd7ca59d75807f151cbbcf225544c4a8f6ae4b8d22d78b3262e31d95326b6664 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdd4817c8633f68be29410846388b9258cf911d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9d2435378192fda74d4a410459abf8fd6a509525afa5a0ef02ea1fa010b8a64 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53c50fd4375a9cd588457674feff56e01dc4bb55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1e858843d7ec4c54ea592c74754b5962a3ce16d669287befcd446b921993549 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cd4dd4ac73205bb477fdb17caf48bbd4c96ecfc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56c6df02c91c9bd6e42e09802129ac883a193508cc7f4386f98d5acaf39bdd8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f6c946f18b8ae578306801a87a1e8d081b553af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f0065e6acc19126137104ab3e2eb45c02b4f2411c1c24c185fd80ac95816ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a779a4ad7d34735d4573b7858059873b22ec093d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b55018b593e39ac6610497eb077dc9bc0fd4b7e7aebbea32d8a2275f447d9f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d171fa13d18eb313e67a6371c7c263062b8aeb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1957604e0b00d6f7d7d5382e4163f78340601d69941699ebc0d884d63d620f66 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e816262a03eb9cac586437cd15fed89ac0007295 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dcce2964fc3458abe9af858c4dacb0f179ce6ccc62eab1053bcb666b608d74d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..90177e0391b1b3ec8ff24a4cd1feea1176bbeb49 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d833bea69bb59e907209d0dc0c6f23f4df89f13d60ac86a120c86a26078f99 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b92fb67cc05e1b5bd6f2537c867c903bbe1b5639 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80ba230e2069e2a88ed8fe4ba60a70fad9c706192d4b2fad1d836ca46a3d8f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..668bcca0d3e5bea4d3ce814bb53b1ae77667e8e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e89ed81e94ac05b016cfa14ec947e210f53388e459f70e26f1cfad648a63ab1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1488cbfc1a13391f299eecd5afe8bf8dbcf64e79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c206c87bfb3de1a9a8da1c8e596505fd4cd144f4d75391fa6349d746a6a28af5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..af9e224bb1d7a2aaed2249dcde856ca9f5c817f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10b80b3710fa3e2c447f08674b2e2946488d12babf3192126dd113bd60d9a93a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f84532201dd904eb402740e1081c8e0cdd505eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86ffa445fb69061be3c7f7b88e7fbfa80ae28db3965a32e377fb8ab2663bf827 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d989a471eb4a2a74a4ba3237b97e3c7d241451a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3424a451bf7ef059180c253295a753830e4b3c1c3ebd886b00488d1fe1ffe710 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bba32c92df7a20ea7ea7a87025f4119ab352fad8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65f7fff3adab788f7ccb15915208ee64dec778a8d6e4c0ae9069c3ba6465335b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0578d5075c87f87ab27bf28a3f44f44958b6f249 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6565b4145765c16570ce56bc59f0cd821f20f48a7c5f57b97fcefa8cfaf9aff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccbfa0be689432836043b4e8f04b11e21c244432 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e03c98e540529807ed12e2b2ed75f543515d9643123ff4a8f870dd1d1ee09122 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad3f5224b70f746c3b2871d08e15a572f33dc409 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8329531a2192c20417420c9c05bc0616efd89f05d50d7e58bff08162e30a0d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db53a56c2598360bf67f09a7386e38c2aea6a542 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3d6eb4e1d8cf401cc1899be03ce3fe904a584240eec5f857fafa6fa5a36ac6e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c80502adfd5160d502448b44768c2eaea0e16a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fddb8e61cd794870f28409bffdc1656da230bd8a9396ccaed8d22ed8608b19 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78c0f14785e1549e695bb7f4190f12eeeeadba51 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03fcb80b7318e750797c74fb8fd3a84c4dbfda4fbbc6cde1a239095ecc79a3a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c96f2b866f803bc52e478ddc99a8579db04d77e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7e28ff658a4f0f3be13356fbec0654c230819f94c29864dd0a1f46da44fa42 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d37fcfd1fee604c55fbf8734035678eadc796ea5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1d97720ed4d6fd18f0fb116898f1c21448d885cdd2afcfb25de5925494e5a44 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce33c1b8041842281c11e20a266e8a2f8a8f0df1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20b1f2c3ff4727dc8b69a0fa8f198c9e7ed4023c28d92f14444bc936268f99d3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68565e9f975b094d7a7d0677c357529178c571e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e21bf87a95613437c41863db169693faa1f13ca895fa81967b30c609a3ae9857 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16491481741cdd624c54de60f68a797016d15ff8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4188cc9b81d6a5e6cbd6c430a592efa57e6aa3d23125d4bdbaeb1202c1cab51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1d77139b99f40b6bb845ffaee60a33d609257fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f14652e12f54ce44419e6c59348bbd6d8e9f75166e3a49b35dac29658435cf50 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..81eebb6e9ce637b3a381a5a762a21785e3115a5e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa107d65b8d3a1bc1c139359e16dad1d589f2ec7f05e86cd865f1868d1f2a940 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fb88752407a020354d28657e39e4b227166d91f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8f58072925716a0809b34179e32c5df37494895a0fc470a538884de89b33629 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98035f5a0a7f345bd0d08229fb230cd390fdd83c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7836b7e41f87a9a2cf967ccf3e4fbb4c345412165bf5993f7e5c6abaf741ef3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b51c69fac89b062368dcecbc0ef0100ee07ece5b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a3ebb4ffee92dfb79008672cbc451246c9a0d8e4e7d1586acd175d3f5c221cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96efab3c2116071726f497d6ef7a0263a0868cc7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c6fc4dea345018486c46fc97f8e1504d3cf9cffd53960989a003747b84b511d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8316e38544eb7befcea0048b9f03e3786cfb8797 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca9de7bb1265a2fbe47f0789809a21edd1802a1ccc38a673e64b3c030f3f602a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4932db5e76ca0a21b9809c4357379e19aa7eb785 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74a7bbd657135b5bf265bf82b97a22729976c1e050933f5ace8acb8aaea86f5e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c7566baecedb27e5b34ec6aa16979cc60642356 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5780199cd25b03a6012484a5bef999f6f23cb218b97649c043896196284b6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86803bdc09ce5f3eb76f7ab4fed8cc5c2ef46647 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:667acccf4c5d10975b205fb83cd7722ef5e90de64e314223e099dfd6dc5f5562 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0afb1f06f15f6d52276a264826a4ca99a3b774cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29e727b6c600efb1209692a414395d37af36bec1d2eba585c4776d023f802604 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c810a2d9e168c893c6af663a5847ef8c90fde5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b2855d094104ba38ff6223941f32c47228888aef5a618bc11ba1133079912e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3284f770d7a81a39b5e127b26325cc8831704a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7604193dfeec0c3c1b2dd06eff1320388bc786ba5f00c6d3c9aca7366973d68f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..548591554e98fa9c82d811a6ff58bf8b3faa4607 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e5176c06134b2ecc89488e7ea22dbe427b66a6cfb11625f293ec4de56d872df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc20c5015196df5591c649bc2b7b09c811e580d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f955721ed856bb95454f4951dfca8fc78078027239680007c11eaa5bc0c66b16 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e7cc3df7add9a80077d305de9841fbde4b952f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ab1b947539c2e8244cf3063f21d3e1130076ceb827c8f48749e82657909f0e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80fae44c48647882fcad549e1ddc791c4c1bdcf4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:645815f112b2707587ca145ee15f94f8f89a9555da47296f4aac5f87cfd88777 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d982c390ce26681b68ff4b042fedc805bdc15918 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e5789e1c2936024691229f1ed8ea344c0cdbfe20ae5d307570f2d2145bda7ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6554f25b63def2062adaf9d4a51aca18be5f80d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e67646ff8ca9699bc561ce8a29ce5f6aa8ae41d612991adf248b0b527109d916 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6547a1accda3f993e72be2f6b7410a8b47000b17 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca0dffd6a672f711a9c53a3515e80596f9ac95ebfff926093509e6341736582 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ca7669cc2762cff8b2a87b6d45c62a3efe01f1c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d62fac78f94f5a697af8a9f3e629e9ab02f0e374f283d7113a732da861f8fd3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..406e1b5d8113f4e00957b81fdb2f5ece762bd301 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07036a3b038d4800a1b92b85b55fcb176eeb9e548798342d33fd67c881bd8c4e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd374426376887bc24ba95ff8f09f9349a04240f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df4cc00b27894da7bb1b2dbf119c3f93e54a198549b60ac8259100798c943550 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeaead31fdaae77ecde9f9e978ed2f06d6f67645 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba3cbf8764c47cb817c0865499307fa91ca0175ec68261bdf07f3901f0dd9fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15ecd6a5e27af6dd80ddadb9411bd0ad9a876b95 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5caa3c73f9da4c4854f45256be5654ed87841845555c1a0ad9809ae524f66e63 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65fbbf65bff6da890a5397f70df4feabec6df269 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:207f0534552443f21e5c92c790d2a6dc3369053296611c79d69eafbbe8d491cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91bf1268e5b0cfc219840b371d09669921cc8f9e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71fc8ed9de3a6d582370b66dff3e718e50fd226d363ecbed09b1292ca19f023 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..200453ba53dfc9a306044244661a4881afe12604 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409192c2e6de694704faba2e3aeb4fd9d26ecc59e0ced29f7ac7d2b4c0df8bb1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f24b0aac024a12931efee7241f230e454d8d5e12 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f910c2b93076cc108432b318a38db52a3772fd1cb362c7f57a722b2db2b545 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b317596a2217da60c5d865d463abb16313374adc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e76d4b4fdfbbb62e9d64e08901b266e1c194153b770e61b5857c2d3a87e7ab09 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..383fb367743238171d8535f225338015b9cd5726 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b39c02e7fa847931aa849fefe01074df5bc181d4018f0576dbfa9a9ea29354b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a5ce2071e43ba460a07356e6693dd050e23889c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b45110bd50ff31bafbe74b6fc8d51b370d696ec2c3b9d21aae4c1813af733384 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef5c00e149b205a745f4b03831688b5092b96404 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:297c39ae730e65d79cd9ffca3fcbb7babcc96baa70b11ebcf8add07ea02d9b4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9769c3967930fb279a453f81990b50e8c15990b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d8b71af9aa83ba312bf1ce26d2d0a8e6c7307fd8ce59902f05a26b7ff25a2a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..83886b39e79d7272ba71963a29f98953da34aed6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0654fbaa73c882ac1d16f3dfbf0167b53a959efabfee529e9f5ea56b7559ca1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eb0ad5e553bcc60a5219d0aedbaf80e495d4cfc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ba42ab045e30410db8bac338684b7e18486d259334e5546ec65586198c896a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ef719f8f2c775fefb58a39dfe91d8c3ade2e461 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7651ae3a05de534ba612819a4aa03f0e857ae94eb04280bfa6194a32348577 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebf8dcfecf7a2e5aed0bfd9186a218b43b07a6b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93bc612c863b86c6571aef63a01957a88181e562df4a8e741d5001e3dd46d765 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..56ad0ab6a7b4e8791e80af3ceffa80f5570fa0fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a4624e520666a11de6c137f4b677fd5b06f488cf856ef658398a3a2ace80fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc33bcafcf1d9c9081686264816de9f315c6b3e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6e18116e9be9841a0b31da02608dbfa69e88c3d031d47f3f48d01ce5b22092f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1999af221f7f1191fc67134c456aa52df295c180 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdf8fb8ab128142fdfcbdfff2dc49db9dc8704658a286b9fd56f68c70f61f158 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fef11b9a9bb24fabd31d657d17fd1dc60d61c5b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6cab86ab0423690d20834c0b07ac6a635a956b005e89f32c7d694c8a060cee5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b69047b7233cfa2308d2c2b8658a57bf3f942e05 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af3dba99406bb4d252f40217301e41df5d944e34a4e850da5db336c7e6adf264 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aee7e10b49c9f02ed921c6509512c6e93bad8c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a10b6a030c356bdb7c5e69d661f278bc3a970c3b94887ab936ed9ba788226af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..949eeb8524ee3158307f7580e0ae734904bf9340 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef89a453d0708afdbbb8a19ae5b0ab99d592b1832d3d9c8612b03088cad397e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04ebefe88ebeb1c838da13bd76e38b436104d185 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8bb8cd25a085d084e06b2d73c333252c888a9fc53711be17e16d7654de6d59a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f77f1f67f07c338dd7b5ca182fd97e9bba6656 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:735088aea0c75f142b9ebde041609b955dbb0c7077b7003560af6813e8a40ad4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27e1330f503d00d4a83659c329b51ed6c119d6b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169bc2f0515c3ed68b7977b9d6b604d3fbfe0c346860654c132ca76e7898a370 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a40d734660ee5040b4878a360b4d80981e6e4c6e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3733a3d6b0fc8c8d4b57d2836fb14fc6e330f2ac7961839affbc311399e9c79b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..640f6f86b8a9fd66b57bd57a6172d486993dbeac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b238091a0593ba54df7994137fd31702f418eae888850f96dafaeda534806e3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b32eec24c99b605b0c578464b1f388dba42c9aa2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4da639cc3424340ee785ace378ba8bb66a96d2b6a3725fe40caf7c1e297d3685 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a117a508cef2c962a0ef515614018f0fcf6d2435 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1341bada428117a34e40843261ab167fdc2c62ce0a80b09e92aa4d01803a8d0f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3efbd3c89312ff4859b4d164b81c24c5978355a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4fd1d11be0119c5f86f3905f2ed2882826f6e40fbdb9fe5af4a87132f3a942 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b382520935c964be5d1d65c99a8413f8e346926 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9772dddf1258d930ab4cdf28a2e053b15a93718a91ae026f0310eabe52a6c3f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b6fb926cedddeb55d81ef2563054e52d4b282c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d532169e2a25c9dd3f8e4ef56889006936cca5ad1f16c124a73a296c1149048 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..efba03bc4a8cb1e78a24c37ad5afcd2161f5640c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c5371350620599582da6e04e3e5e4f626c6d180a8662c50fb07e032e393c1ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f978b0169a60d64b144fd6fc793e0d89c8898e9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c3822b5a407236a0fd07b8e9d68527fed7b8fea49682b8f9bf3c3fe4710a581 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d6ec1f14044fce9319b5ab8d78662e0a390cad1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:078d9a38432807e7a572b3399fd3dd6c33e29b87901c4486e4e692d1060eb900 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..172aa7695f92e55e6047a1cc1cc71a3a5a036d8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bab91036d0506b1c9f36a84bf6185d319101b0536410148edbbb23d678875954 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ed167279511a28c599587981e7e0ab75620ed05 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8705df510e418214e23d3436ca3f9d4fb72e3f66bf8421bb292a2cb087c7a58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c87f1468f88c92b06ca2a3eb248cd9141e39ea4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a81fa82e63242d470e0c319bb583a41676b73bd1379d67dfb32ec7706e3360b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..317ecf5d3307b11f4fafe39b8bfaf86fde0c2853 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14dabe647664963d552f4676102890ba451aa2944319e325b4d513119f57074b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e551e5a027f074cfafbe4264b0d31399b62cd25d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6ae579e8f023a50580996bb2deb4432726b0b0f4adf5868f28b04553c3da344 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..840d240156c6f0691110d6c0013b0f87437abc18 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03f6eb39a0d75a9cf6c9164e8f5036655f477fd48c4e3d7e047e8508e64e8d82 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a49b8720edfc06530537ee4f423773758cc1d6de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e003feb6fd5c6ff414aa9945fe0ad9d5dff962ea4a2e25bc8f0a80845df9f32 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3ef3d32f9ef6ae31d75de9d518c1019d7c600d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37bd5090617e7137048e02e648bb8b544b875b3d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ce70bfec5c35577dbbc45e5d5f1ec59aa5aef18d8389be43435c7008dcfd83d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..82588ec7e33984a6e814ca04f24b3df584551d92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0dcf2b82615aad41724a3ea468ed073b4d2f08e3b26e3e164ac85587bb575f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48580e1d554906de90beeb759fcf15f22ca5d77d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80a03f62aef87b00746ea74255cd95d3b47a6acb38e04346cf3846e7079076c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b80ab772e015106fe19ae139306fae71d5483512 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d81437e1e8f1eebaf478dbf1fe19610ce4fd03d83c7cd4823478c66c81e76da2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e493ecdc46ed2c476e5725b0c7575f4360a8a80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca304f987c1b8e8772d0e7afc53a4d711b5c41f9fba75b45531888b7122cda8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9c0f58727e3b5a8356418f0d2b7589de9a462 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e09f5d5fe2000e8c89014cd19c97cd7cb130e751 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904758a154c98c640001f446d4c1090c3d467c6c0f2cf531137e85c98eb016d1 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23770922af2e326dcc31b17cf8de98dbcfd8ba4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:523b065894a3a9e6df42c2e364405483b558094c1cb97538d4386bcf8ab64ec9 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f878581ce5ce8d5f76299354e08e0e481d9b9ca8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1381305e81de94ab396b27da4295667a403d16d85883135bd34d021e0c83f9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6724dc57f22611b78df33339a35fd6d42f4a6b71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c7375a008e2bef9023e17fe30f40adf9fdfdfb445c168d2fd7d0b423a6e1246 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..506a53d471a005788ff7aa14cae6a24f8dfe48a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f416bc773be74ae9c440b8cb04f0aee2a6ad6670d946fe388c5322daa25c9f3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3883a782c672c2d874264adb7f122816bcee240 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b572a529fec0918dca8112fc178886cf171fa51d98bbe9a73ff14b7f484f325 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a60ac7d72081febbe10cfd2bb8ea601fdc3a692c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b5065cf306017afed3a60bea224899419fcb29eff9f5aa987ef204eb529589e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23e347610357cd7853ac0a889ea5284031ebf798 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20a49dae5418dbad4677df7806baad241b9da3a57cd4c07189f80b736df882a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..288d48e428c59614a1eb896ba9039cd3f46a0ffa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c11cc15267c7049fb4385ea0e0d29aa8b749131ec34dcbd17840617e04050bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..faa62a07d943e1ab4f901e4ec477d3bccd20edbb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:707a551ce2aa81f7fccaa1d5edc3737298a57ee459f7cb20ee1a323d191dcbfd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ef91e1259ac424af317f3cbd598b5fbb60d7bfe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e159ab50e181f0ac7af9682d8d39115a1f2171e783678dfa3bee2393528d447 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bde6fc02e43503e2802c47f45d6e2f29dbf15bed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5936f31ee770fd809049fe67dc677450e1c1dd2283aa6039253ed2997ef6ec64 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bcdf3d4267b6bb83f18abdfa318a27528df043f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c1dc0fdeab6de176966bcc6cd137a91c38c2c072fbf6914c6b7a64c06a178d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84e031b92d67d1271fa303c8a283927b8c57a0ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ad2bec6ff9b9311b10ae58cd928cf274b7ffa5d8c3f4a77951206ba729d6668 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6268598cdc3c73463bc4092c3148c4ac69a2d268 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f34bb0dec05bdb2524555ff2aa5eafbbeb4b76d53de90b5783eee0f50786909d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bab30cb92a1ea10add962e97ac1c8e72244bd3db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72bd8ad92991dcc58c97623242270de8dab661b6bad2cbd3a277df51f12cc339 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b28a9bbd23b3299056d81d2525b290fa4565c341 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55e7e1487d3f07a76771c18d89a6fb794512a1d95e6e3dd32fdcde4d817ff270 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63a35c975aedddef39d6daf865808cd4e5d169f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e82091040308e42fe6c1c6bdf421acf10bf5de1c0c23824adbe87b001ad381ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ddfa5001b70c0acc666d1f065c37301e3083fa5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:145017d0622c6a6009b2c49402a7cb7c62fb06e97cc08bf58a7fddf27bf39e6e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7def089daf671d375bfc04a829a999fc94527755 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db97d63d00b64583e7e6d93528e3f2312f1d0e2eff81a90545d865e1fbbe5dad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..26fdf1bc4117e300da9531b8dea4c061e5fe9c28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e50671479105857ac64e90eb67406882446b96c2eb1c850b443fad64d40c7906 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae8922a5b8a8c7afd08103660bd4af029c07f17d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b9c2123f1ce4eead21be7cda9a5dd676ea84375c0ac0c33d49700832053ea72 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb3377ab425c489824d3b99f41db65fe25f7e42a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2c955259ac4ee2a3e63fe898ffb6619141a83193e3f15d748b1010c826ad50a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b2aa2408325fb2023189cd581ab76986e4cfb0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d54c81baa67f347359db431a5b0e16f879c1bdd779a83ca5464a41c8eea2c41 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a16ddb6ed6d5e6432bd53f37e8e890dcddac5c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d583c203cb4ff381080ffd60531ec84422da2b802fd677c9cda31e1257dc0155 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a82f56b9fa5717232950fb87c162f9a88078ef6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b6a48561d5cf907ea2002770ddd2873fe657cae371f72c7931c9d75ad49b7c4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..249483b7b4ef3b6680c91c26378c27ecd88da002 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:703a50ab399b118977dcfd3973e9594df90e456ad7bbc520e7d3d56e76ccb570 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16edcda814697530af6e575224936ab5f7a00bda --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:591a734bc1b4a36bf074a0cba778bfb153f62af2245787ee4bd1896394ead99f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df6b9a788a95ba95859113e53c3ed597fde20622 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff472ebecd1d9252987005f3d7b5ff669f3b5696c8f8a06ef6159088f7174d4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25cf7734fd975849b45fdaa9db2f835441729955 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a2af5b66f5b9ae90feffc086bd6e84c72d512e5ee027e68d42ec6ab33c8fd38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10cc8d506a798f62a6fb01e6f303119b959fabc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2484cf56a27ed18e3e48bffd3910abc611ad959684f61fd59df0b2efdf4c8b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dff08d5624e83ba27135105026ef754ee5f8a26f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620e18a930f78e2db74533e26fbcfb0d1c95155a19ac0767a515fab620ac6ef9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..214323c6d17322b319d97a851cb09ffdf601c703 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1e56262431eda3719185a252d8e868ca336a2b489301b18e44483ecc9aa467 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aaaa2a65a31d119489da8b2dffd25aab1b33937 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5efff52707a866b21bbb5cca1d90a538961aba14ca4b0f398b91a7a9864193f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..926470c4782de062571cb8c53f5e0ec213268b6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:056e2a5cccc57414f20a22b8f9329b21e23cdca9ff1edc4995ddb6f72733ceec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b16a81ba3fbb30598e5b6f842f0b155a28e1446d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dab6927d9e1127d1b04bf8b72ca94d9c407b551d20dc4567cadad685bff58e13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..445b6a3c5c3000946d375765346fc905879d4128 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9d6d5297ce75214d6a2418a4f6ac449c842b64578c092665ac77b3510b184f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..128085a87ab957355a01557b087b17e3b6f50864 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:687417188f801210ee33341fe0a1840f218c9ae27d1328589f0418bda04e51ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57108a77a61cbf6d2bd623d5742f1bd73605ae61 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ee999bfa9cebb18fb38d2564b3c41fd46644ab59361f6c0e007bef2baf8c2a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ab3140938619c52356bc061fbae8627f4430e39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:434373513da0786adc049f39497f0e708ce71b482897a579045ef46dc773d0a1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54a16b0a23853174e46d643a1b9e967135fdeb37 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7deb221504fc1b98a2a401237d29500aff2c8eea1b2cd5827de57c9680a42014 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10dba1bd860820c10fa62df04eb58140b4f5b921 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0589199800c398f1ec64d2a7de06cf760de3481abc54f75e517e6aa5363145e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53bbdf228a7ea2b724f1908507f15168ecd07803 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d2855c8e360729c825ed74dc9c8b09230f654d0b8e387e83a7b11879042a395 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9dc2c98c9599bd6d7ea27530f9ac780dee4d25f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10edf8ec75df46b941b443cde173860d6e83fe2775a9e898e0391ac1df032752 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1995723e4228cb300ec777df1b32b323f364ce66 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0487574ae995bf7b46f9bd88d2041ae0f09e6f459652d2bec8dd747ad1f1e05 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dd3882d74b18b82ee4e1c25205cc3cd4acf4e2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53efbddc85e2e2ae37282cf890754fa479781b833140e4b1a63c6a971bea5087 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..179b7702bba95949953bc3047fd1787d868c66d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34380eca8bb0bb97fe2c0b1b19343d6fe169138ed9933f9bae883a47e80292d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab4a9417f9f2e1e23f01ac88f9c2b79723ae4bd3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323a8cee40ae8a365bb3d8cc53de3d3936ea7d04674f36365b7790722760905c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2929e40d4c11a69ff90a4fa10b51c85449a70fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1496fe8fb9f1bee89f1a5605bd9798c09c3a685f00c6375bf8b844bc982c33b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..426607160e0431e41eda511830678cab868c2b58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdea1c0e957715c6141060bc1631cf054e13af057932d459f3b818cba44461b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb363a7065e607a2e4c29f5ad8afacc3466f50b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c28ee33ee31e72f4f19591228216044c78c8ac8ed0ecb5acfc621e16c0fcc7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb8a5b961ddcde3b9da9e855ce625b7a4458696a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:512d13fb09c1a6f8921a95991ab6cd29080464ff92a16728c763b83fe8905d05 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f2e523c7c245bc9eeaa259419a190c0f9320b5e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651c02cd95e7958415a10fc9161f5b10db7007f923433122af0874ff549305ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad7aec0a8833eff877e57bb6e01395bb59076fcc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae565eb74355143b3f36d75fb075d5122acf8de86d59e9866c1719489dab2208 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0096b84dec9d59ba516d7a62942bd05dad55b08e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59743378391e00ba13f5b30aed88ddf0fcbd883e3f709551cca333564c6336ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a583c3b11538b334e4f830736ce33367daab27ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96af1faecd111fb8cdcff10d5f4012d435b2087e6f743caa04e6e816238797db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9635e28cde352c1c33f087b77afb1402ce54a271 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c081a3f3ecf82cc574d14e18a6f3295cb2da91d0d8cfe6d24a6651da170ae565 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40427beefe71d8ea6c4e3c1ceede0128240998c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f60c79a6301c1f7e19c7cd2281900d3f2945f3575e6234bee6920208f3a4e6d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5a06ca55ab26c4112d181b103e3a59910b48d05 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9356bfa5eaab22857680db85e68e8b5fff1cb0f58288779fbba089d072b26715 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c83c0984b29fdf3de79de3a4e49fe5a5e7706a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2b415eeb622aeb86258ab5d04f33b54047478da8f661a639412f516e75ac23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17378deb99a9a0ee3fab1019c2dfdfa7a44a9cdb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8ad16bcff3e99c12ff7188c998aa8ce60f309c52962fb3ae152b8d6663e3067 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93065d1c23976311c5dc9d2ee92a5b400076fe62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c3207541a3b88cefa2729d4aae7f8a6b57acb0ed0a5cec13fe5dc26b0141835 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9171252b4a6e12988386140aa71d4164a26b538f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a9d5bd9b9a07315f7b62274939c66dffc9cd0ef3239ab988911c862d644424d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e0c3bde2e3457f8e8db9788882efc2b9b492a70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68cd2d24958e0edad363af8161379dd7a2b57cedbafda05b6fc41642d810817b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..693e2dee13f7525c7b6701f1c86281b4d1dde436 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651b78fde3774d273576f1714a75c19758c9fa2f2257ebc326dbe59ad03ed4a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d8f514967f848a943b2281f7df070700bc7faf2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c65efda896d576998af41a39d3d791dda30aab5d687a15c84bda6be95d7ad263 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..527cfbac28a318bda0f936480b1e70b3aedd6d3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31c69408d1c2bb4d71a6826745b6e2953113cd3eedc1776d2840fc2aed8afcc5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd2233d13c6949da3f9d947af8696e42d6ff6097 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:296ad083d2b38be9311acdb9e07b77fbdf89681cb685771193e5c3111a06609f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8655c23598686aef2a0cad69f06c21cb87197ae3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8005d0a4715e4e11173f79922808f50608ceea52c1ee4f672f46d2653dcbf51e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b5e9718a409c71823dad424bd62f0deb0d066f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d040481089270457c58dca7434c052b28800b607d8da4351f7a81db1820a1b43 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5190b657e0544950bbdcf0e860318f93fc08eb75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da658271e5cc7ccd528cb0100907adf6237b3e4fc3a6934d13dcf0f1664a7cfe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18ad1d64abf2517779d72cd35f8cd2176cb57884 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43f55331124c10ec777710165b3afe92f2098d38252c80b5bb820e584f5d83b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dde69fe2d146a6955b3946c4843d5736c9fb5cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba62573eac08a5ee31d32ec5b1bcac227dabb4d6e559d08e73e57f73af1e0b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a9de38614498201883f1458f796576f3c825c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d642d7c4d13b42b7603b2346b1e1948637464b753d7ae0ccd4abf26cb6930f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7635850882fe507399b44c9ca6195d796ad31b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a15e349caea4adf2668b19ad8f1b4dd889cea87f51b608514af8339e8e68d9b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a1a7fdd2e564f9124f0592c0df3f2e55ba6d489 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f8084c19995d55fc9ddcdd0537ea431899b43e121527708f1ba6f39f425d884 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f603cc7443dedbb08d39a18de54301aff0c41e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7959fe20a617b96fe5d11eb4fa5cf9697e51554198c644f8362fdebcdf73ab9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22f1db231684379bf841bedf38482c5bb8059e79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ae856588cdeb75f79c3a453b6e566d37037bf0cda1bfc54a29225f1295001d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3e493b9830eb3268292f3b2c1d33660b4e090ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dfa44defe82435d46da031b78801389c3cad82e47146a8121160f42d157f9c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a90ceda71a8d744d401b30a11e73fd7f8de470a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ec8cbacadb686deb2f7cf181778f6dfa9f33909c01fd2ab65d80c51200efd8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1c0ae7f8ce58bebecd7d344add94b8146d8afe0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e088da9350a6ffa04d45a931d0eb6db62c2e46980d3402cf2a199756052d2f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5302f376ff75dd74c2a1c5d49acd0873eaabea6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b713178944580fd7a8bb3d9a0095f6356cb9907349b8b96840522c993174a54b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1930866eaa41a9eef4f9ddab30360ec219dfa16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d50c3b67d89e27b5610f97edcdb54877f1ca782715d62ae2d1c63d4a9380306 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64405d1f201f98d4b7a91122f48ce53fc0ea2daf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92897f3868f764eac7ed809a7d75eca0ef3e9ce72d71b7cfa755d0967c40e4eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e476e79cb5a8e37509525557facd2feb370dd0ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d8b0cd97a21a688f531b395baffb4a32920c1498d1bd2a68ecad1e35d085922 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2ae28820a0bb576b2691edda7473c80c67b152 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c548e1e3a96026d427960bb101cb482474cf4938f0af07412338f77f618e6ae5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..075f4cbb3bb682a634b1184c3f5220cee88405cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec14c240149fbf84de52c501e59d59e8a230fac089dc4e61ec0c6702c1191c09 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a287c5d0779c63004e1e6d1513014bb8c032766 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f09b553bf4f47ad18b9ec5daa17c7cea7c4783985d697edb7fcadcd782e921ce +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5bb71dbdf39c7ef07d93b63478ad9841cabf3fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51f8f16f840dd460e5836d29b44a556a21d41b624e24c87a5f66bdd4a67847e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..337baa9a5d17d88f46c4d0be9ac7b2fa1417137a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1535a8903b70ea6ccf71757f5ad51bc2d9543fa712553d9bc9919044ec83bf3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3253ac9571f3bf7d0616cad54acef172956f5bd5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d75f862b12243baf05396b744f37ac0064a73f609e64300b16ee830993881fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cccce7aa4d629c76a780e585b0633ace47bdd1fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e203a789f524b1ce47046fad17314234fcbb91810029ae5b8e01d14f05715ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55ca1a7a9ed63bd6d9d9bcec76738dbea2312207 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c91825def4382b5ac8677e642af8755c98e1ba27db7e8b10550a0e71b6dc8e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63219dbb7969a2f849a6084f36f8ba5ee0fafdab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:814fc31e8b3d5389d30ab85f41ecfcf16594266091a038f108859ad1fd30ff72 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dc7eb2958f0adb50ce2bc13fac4e9391a609748 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409fe26a59af9007533c289f7d332051d10a99f52e8ac4223f4e99b47a9764ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08b88d2af3ad217fa3244d346036cc5a7d920e6d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a13ad887520c9003a73e68155b7e27c1c0aa9a3c6d96eb5a7c1950e64dce1495 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6ed831628ceefb2c2637265aa64c5afd5029f60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a361d3408c032143fb8c76d3241c5d50c1f5db701938ebeb01e061b3e685655a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dcca8cfe6711fd4f1eb2bc320967c55c97d67a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39497999e8fe34a35a6ac91fbf827dd2d321c1bcbbed8eac37ce816f5c7c6b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e3dfc70c8c3c73410e02ea214427eb64ba86a0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c726f3e818f2ef3de78a9fe06470c9db5e0b5c8dc33dc27ba339ab373ed7a718 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42ef9b79f8a228942603f85f5b5e371dfd3a8a2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bd9a759c014850415210eaf6482e199d38f6de11d25ef0df92b2ab23c0277aa +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..663e3104774a1592bc3538cca9f16a2bf9e81ac6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:275913ef05467be7915bf0edbe9428fe800a7490b0b4065d44824fc272c86eca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7910b11c1f2be12f2460798a080a9657f09ba62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:242cb14121cdff77595168f63b5072a60c84b6c0b79cbc5cdfea8a4250929f9a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a79c9f1fbe512e4d4360d100b597874edff7cc8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59691b768cf0c6abe800a021dbf7d5a61d292f0417c839c09c48da684410ce70 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1ce3c9d6f1a2d6c2aa548e213eb52e490da24d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abf9cd7b56bf6f2329d5d98e0e51e433395d820786b66644f826a88b81481e62 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7d031982c09e295847e30c67694f04998d1d0d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ae4f6dfbcb893e83bc0247fdba028937356e9bc4621f0948e27c1ec9fd64a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbcb197029a097f0412e58184f20d7c89e307d2c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f51d320c54dca4fee33cf2002efbd70699fec5f23a978f9411856b880d6a7b55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aaefb2073f0e22e394632b05ed705ee71fb7632 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:809926c8c088bbfb3f4690bcb838c5913eb3e67e9d3cbe2e96b66dac37ed7f3a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3519389e9e93bf3ca6d5b32bbbd980c609a2c2f7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fae4f83117da6b48aa411f10ff348161de3618b2942e89522a254835214c39d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1324e70e8f8c8f1f52542733e517638b1e271198 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34bfed9879860a1e62179a4b90c9ad04757c9e55ea85a5da46412684ea0a495f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..efe2b5b7198ac028baefdd552d3ca484fbf2ed2d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a7a2701aba099e1396d5279fd38792d4534786ac7a5553ad351fead21b5e458 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5895de3df648a7aa40e9f8163a3906369f3bfb58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb135b17786049ac65acf67d5fb56f9558e60944084bdf1ace129a3b735dd256 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63b20445fef685ee6f1010764e8894f29ae2c452 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a0886656f26fb8a40350143ecea9915839f2b4ea30685e89220d33992ef8204 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bff0c0ff3de3187ab428de61836f404a2a232cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:467fa6b787d909113dc6e6dcadef60d29f9aeb5df5df70bfc70bbefec0341394 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e6c19bf9230d2e523ca790611d5c6afc93311db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab20ec25337423e6afc8e7ef08ecf4a9c1f855675b2140f1fa3220029abd7f3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..84a5287adc13746d70f563b48fcc81b2a17d028c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:604c2e6c62e7acca54f4d6c6726146f7e8be86d3f36777c6a627158a9eed41c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21367f59c1eda377e1186074b7b53752eef12904 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15096b9ae4b8fb0fca343143d3a2ea5cbb99d231cdf9318155afe49721e387b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b12d6a8e9f908a1ca52bdb2d543eb84ab8fb2b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:326654ab615bae0ae9162e70e6de419d5dd92bf615b157687aa14fe7584d0ac5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bd7c301b2527abe266dd7b8f4febef9ad69c53b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69a84d68f3627c65d22db6baf797cc928eb48e87e4932cccdffa64c3c1a8991c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f78e8ff257ddf81a7ba37d179834f6d0ca618b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c799a7d9e3ed62f9018742831c7d67b36b12d61fb65ccee5f644f5538b375d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8701ae10b54da46a227493fa8d985131b0e6a578 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b5494d624dddb2051b53a36c59bc9086eb04df96e6c8a7ea4a84839c7722d10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44a1ca3479d7579732b92a0db7a1d3825e69fd9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e03cb9895ebf466c6dfddc39fb3df420620e48a15ccd9932c40e59c0ff4a3f87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..282c696b0e9cebb8cda6934899c4b4f576c93d44 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e426162e2b3890e5b2007a701111895232e2992db30d24928d8ee130ba2d5e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30704dcc171250090d3a3723d93441cff8d1a23a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e321ed7fed2f70b5b6df87e2c683839b66772dbd2c5723f8f42d16df127749f3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56ca7ae4d3243db629b10241af6e564dc9752b7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9455a7de674f4f871d851d3b5c5155e6b4a588a01a9a9df150b001c644dec76f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b857cc0a74194e29ff3028f08ffb4281796d9e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:babf2369ad59476c8d4f662f079a32ef6fb5bf9c95341d08e1b5acfc7825506a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95414f161317fd18599a46a11814bba96ff278c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c60409cbc4b964e14611431bdf33ba0ec0622d82a7f4396c983fed989fe4171 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a934968cd704feb58e8af253941b8a7f43378f34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbcff0b8121f497937128251c86555049ce85db3a3dfd4aff35d520f14f5a3ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ec25d518629b36596a865619044ff6212d2b350 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6234c8d856e0369fe9933c0b0b6eec6da03afe582a31dafc5479f49f1223f935 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ca29aa86c972745855b9a76bdb1f768d991a872 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24229970cdfbefb5b13861f66320813aa21901b4d3200f5a97af867d8912b654 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..880df356044c0f32419e397435d80d1353040214 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20aa5ad78ad204f1c2177982e55ca5cd33b357f9b90c603ef8c891422164d5f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89e8b63b83361f0d6c782a44e652586f79d88b85 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:637a8fc90d8b7a5b399ccad261f2082d36bc82ffb7622be6c24682936a1d6edc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa302e24ad6a1625c92120fc5d43c17354e6cae0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb6589b66c165dd25005d95fe3bf28a6db56f8f0b89e9d60eb827266689659d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8e66a3c202a2e8bed6fd7b847bd960fc63fee5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18a9b6c05446b04a12250007f17b08fbb5372350300c3357e05f3233cb7e206d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49ec33f5d54e998fd8f373f3a83eccd9dd1fa96c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb59678a91b6dff538adbcc01d074b641ae02a4aa15c9e01d5a984fb86091dd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45a972fd73c6148468af6287184bef1c8471d57 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dea34e4e599eb5bb034e50559188d115eaf246cf576caab0d149eb116ce9c012 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa92609b449c9e24b49fdfeaa307e191f2906b05 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1f65804e077d460c866c15eba90aff7a71abebee3f41315d66477e40d839a36 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5431bfd386201abc0232dc63be04c55ff0026df9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0c24462b5b6de4ee6ffb4902cbf254a64be1dda2312f29bd633cf8ce3d1605 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f0c5b493cbd50911b7491de762b7926fceee9ca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ac54ceb523af38f8552614d971ffa9550df04ad524301d7072fea133d85f95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bad2b0cdb308abd501d39d7371448fda7630f6b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fc3f6c7d342d35a307f4ce70569c78368af63c261392597fd554c3b9f0bde5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4688a3094e9dbe51b4dc0013047316434c05664 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d56fcd904d2534e26bdbb956cd07887854031170c946fb51e14f8dd97f86e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..73e88ccab147e2cabf5d613a640593348d81cf2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b452d1e4b1fb29c699c7baa2c886a5522ccbbad52d9be7a856b8790ad13bf95c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08394e2b7384fda71376d705db73196ea61b1fbd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84bc6f7799f5f15792dc10cea78e4450b3b9f6b44cb532d1161f3290511b1edb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cf4f8233a96e04e8483cf04a0c5f2b191283777 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffde6b9431a22324aa75294197f07b73bb7773e2f03c0bb9e86219e1406e3a45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ba6db7fe1cf9bc00bf7284e9eeba8374206a2e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ef6d0a5306387e40754b03b29d7c5c5aa578c5133d4dc5c4953d59e8921673 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e714ff07d817ca7bab20048b23e241b9dcc93fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fda0f58df3f641a8f2046f6aedafdd115de5151aae730f2e4116cadb3be89c08 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c0cfe1d12b94d115d6f6df2aed597336e971053 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a22b4e1bfdb534777bf6abe1890d8a01e725e07f33fefe79c6cc2e776ca7ec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f2a599f152e79cc73079a58086abce8ed7ea0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87eeb074cd255cd3881ff47f4d41f7b39ba52ed8c9c0154cb2def39cedc1bcb0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..568384559181f25f8c731493f92640c4b9e60e00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc7de326f10b56b6acf5b5618f90bc734c08012e1883e3667f46e82cf28812ec +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cab4e854d56b5a8c6b9552696debef8236176ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cde10519df6219532a5ebc7a47d91fff4921074518a996ba8e1f9272d093ad0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..023ae0f70b9b70fad24b2a9c09fe4b9baf670835 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8faf70721dc614f619d098e258a66e890a000dcd10af6d90e8de72f2201ab977 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27ae7224d56c642fb01c8e9173f5a6d9896f4164 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb149b82b0bb1ade5b4644ef74df5f6a80e03d86934c53602ef73be84b074a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73646066d1a564a17e0ff5f03c4b8039e4ad3ae3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb241145ca0a5d12458393b21d71e77c3a40cff92fd5d8a623404359ab4d0e3c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..247aa5bef3735ee75b7997b099ddf732319d294f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8efe762cb7ab442cee2d36af31a8db0a5c980c2fecea3d306d3ae8b4754d9599 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8235ba380b9092c9d01808bc3f39c9fbe5cc98b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68d176d292bc19a7aef698f8b03e770752081f4a4c75ea1cd028ea9459767675 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4e4b999ebf320bf5657537e46445e0f4d3b04c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb4bc60b6332a8d803382efa4eee121ae4608a8d352ca3543c5efd04cdbf19d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a0f63e3460aa95aebf7b92d38b0047a4fe94403 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f00822826d38daddfdf460fc6ab5b362ef0493adf223cbd4a70125890be7d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c4609a830780ad8e8b810c0ac81e4bae6acb4da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6926eba6542817948ebd257e51b71c7fafe5dc31d6e28c3d3e83d246a95a4c58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85f1621219d60a57b3941132b67655b28c3c2cc1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2beaf3bdeded45b5e65bac6f9c90fc0242f2effd23a5b1ec065b706440ef4d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a1817a2bc8a297d9617dc431987b754e865ce2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63d96f672cad63f06090610842354fe3b638e9941802e264ddfa667299e422c8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37cad253492b1df7919fc7e2564fa95a14d5a5c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccc94de866b9f64d35adc7d37e864e6615490e4350619d748149b02696380ae1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1122d2e10d76f1337c9e25612d3f8a842549a9d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:692292e754c2b054973a695d3dc6056265a7dda4aa69a88099409a8d50a525bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dad33b8e74a8e6c4195fd21913445eb05494ca0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a103bb2d4d1c5eafef21b4b8b64adde8468d48c364f6ee2b11d13bc5b9c50a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc16ae5bc6b9e04133de7cff6758be0345d7b400 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:549705e5c77b09b942915fff1a4c83f995fbc2ad882735862841d678a870277b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdc78156b520476cfb047c5a2323b7e0baacb264 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f6d97038d2b243f99a8dd52c55808bb53d6e84efd31e56a5e64ef1d11f36f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f7ec12397b1d453bf1085514f373769751250bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bec19418677be7106e81344ee1780a7da9a6201648ca88bef44aa8f4c549aed0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfe0d76346ff67ee26ae0423e5116b8e8d577e3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2909d740151d8440ae71e18204354f9151bc34bd9b18b3d32cc3101c186c7420 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..785dabaf97624cf4cc1a87780a79eba12508b61f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1e20d91678f35d9ae580e6bc8ccb55ad3d6d85707185c753c17c7d55d65277 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95dc0f486fa8c9b57054c8fd73ea201e3aa8add2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3adc996f58b7dd25a92ef4d0494c9fd90462f312368b6e8ce481009dddcc7147 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac02bdbd624f7233ed4cb2dfd96b376e2f131bfe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e37b0b8b145c80f86a98cb5c9981dee4dac86ab97cf37ddb8289809dbbd79ccb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..162f84f5a954e4b867bed87c7aa4c47682e7ef4c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56d70c840e50c8cdd19d0e0bbb01edcb1d8de7304a625cec84964c4bd0cb7dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c7d7c8e5dab9ff86db1dfcaefb3d62c4d5e5e09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a36ecbeb805a953d01647f155dd0d1cd8368efff64354e02b42a99f08796636e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d61b237bec051403f35c6d4414da2ad1416f38f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b1ecf33b9adcca2b97b68a28f25e3a3747ef270eba5f52d8840ecaf5d2d091d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17ea5cd34191fe511853f72885e96acaa8f9ecea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a967d58ec00c6ecd8c622a03e2b4b6a56260aa3dbf4a92990ea0bccda6e543ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee0295974c7f53bd945d05d092182b69e29fc737 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be01308783fef1178715ebd24182c1a13b4470e5749b178dfd6bd24fd72f13d6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1612c141ad6089a90029853fc2f2f934c532b06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83dd6312c6ccb5cf5868a2b839e623663cf889df06ffdca012399041e9d9a8c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b6c8511c882854eb65abc8a546f7aeecde0faee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f9795a7f7fd5a864a3ed4dc9a0cdb74a93b054cabd11bd76d9fb328bd62cb5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63c1373eebf365f7099cdcdee28b244a622cf998 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8111f3e4d6c2cf48ac4f45041e1a9b37756ce1b6aa71acd7cdd7df4efe7b92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e3d91923c893f6b3bef44ddb2fe47640b74f86f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eebb885480c5d28fb308d5b4afd0a5c737a87c19a70911d862af028d7283d92b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48946001fc729348217a83bb50a03e37a342c059 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e32204f0738e3f2c73a424e6db059fcdbaf4218850b6b962dc3254fd5f9ebbe4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..addb66003290adb1b3343f81c54f56faf43a5ea4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51769a1d35a9a2c59e4c11b686dda640ee0a576928d45f3075180d63bf149f20 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cc6ed394035037f82387f735df91e8b7df6031e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94dd438434ebae863d1121426cf5f81655e10ad8950bdd7215ebf9f851859cb1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b495ccd0d90228c3d3a90c1bcae49dbf319bc54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:413ad5b3986ab0edb54f6b43c3ae5641d4a00cbd5fbf8ed588ae6b171828b311 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd65d9de32dd353bdfb9ed2215c588b3abf54740 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443a2d30924e251ae8a83b93c7e9c37e7587a9475abfbb73836cd9a341e25985 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e30c9b076b17dc162c914702d47f26783decf711 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26c28eb132db2ef526b9db1cdd855b8e4da72d370c94bb5386a54e5fdccac36f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d172749c9c66e5cdcda8451555672197b18b5235 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4b3bfd36e76f039d9a5a2bf4358d89007b2631c8391cdf63dcf997d1fd2d6e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70ac7b0cd1478867341e2f7f6cfbae69161b44dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bf88900734fcd6d8f5b6154009f92434048cf86a77dc1e47d67a1528108909c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..19ea0a9e11d66d849d8fd34b735aa1d42c4c6df1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21380bca6566f78524424c0595b7626d08a1b0d7bc8b1392712a3bfbc98bbdfa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77036d7e84109d50381c50370613d15ec2713825 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b824a5f1ca6bc3dbf3c21a9ec3537a44412713ec49074c25c2ad5496dd12db6d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..114238ee54ee22769ca3b5b0c5800ef9233d2cec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e247e0be97cdc529a98e48231c09774de475a381a101b22fbb702a14897103 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c4069642d2e58e4e047e8227ccbb9a6f7760362 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03c8b0d45176653d24c9e2aa97592f6008363968ddf5afcb7d70c657522009d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08643726fc7ce55421127f4ea6dccd6ff78c3529 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917970b83b1b4cf0b1f01648e29b620fee1c0a7c5c93060b9cbfa14a7a3da53a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..763f970a60042e4a75bcf846d5f4ee7914d22efa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:544d8538e08b0277d8670e497a106420d0eb05f3ddd050a3e7913e27eecd4e93 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69d426498838ee3009771eb3e4563dc4708cc229 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c75612548640cc9772dcbe580208be49bcf0613f5c07cff0648f3b9cfb03720 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a1b9aefcf43328c1203093613913628fdb27bdb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ec12d86235479bd333de33f803196d44af5ed44356c7d1b562710fc0fe4902a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca99e56e33c277d102775384f35787ed2961c637 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd7ca59d75807f151cbbcf225544c4a8f6ae4b8d22d78b3262e31d95326b6664 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7465036f862bb24a0e93be1a7d1aac81897986e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d543bc62c99acf94fc2442400c8b74b98c1f3d58653f27b23686a3ae4597833 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdd4817c8633f68be29410846388b9258cf911d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9d2435378192fda74d4a410459abf8fd6a509525afa5a0ef02ea1fa010b8a64 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b973fa2bf88f55477450a2ea31047ab268bc73ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:908cf8bcee42b675bdec1930ac33440c9866757b0a520d9155604b1de817a457 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53c50fd4375a9cd588457674feff56e01dc4bb55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1e858843d7ec4c54ea592c74754b5962a3ce16d669287befcd446b921993549 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e38e83bf605a2c1d9e51460a1d2d403460fa1ae1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85803df352e4f5540a2413a6ae5d8e1dbd9b4f6aa0c6ad1ce4967808f1ba7d97 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cd4dd4ac73205bb477fdb17caf48bbd4c96ecfc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56c6df02c91c9bd6e42e09802129ac883a193508cc7f4386f98d5acaf39bdd8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59c937035de0330136ff9a6fe17bfeacdc9206e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b045d2e0b303bf2f9a7aeb7759dcc6a49b2901e08cd2d608d99958383956f477 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..580b8083b3ff651879def0a1b7af0f107158bde5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3efcbe79775478969e991c492228be62aeba1b9e5da26e70bf29bee6d8731dce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d51c97efa649b32a946713033843434d234bacb4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25691a194bf47e0d9f29e3476f36b17cb45b67d0edbd4f94cebbc9da2b83e344 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a779a4ad7d34735d4573b7858059873b22ec093d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b55018b593e39ac6610497eb077dc9bc0fd4b7e7aebbea32d8a2275f447d9f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..feaecb476944ba89fab0fee9c36e50b1235792cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f922db076d87b1e67216fbf6704e3b897a4bd1fb001d15af2519de5fc7c13834 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d171fa13d18eb313e67a6371c7c263062b8aeb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1957604e0b00d6f7d7d5382e4163f78340601d69941699ebc0d884d63d620f66 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b638e67dc8e738c4fdd1c7dd4ea734b1ab644c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f430aee5ced5a4cb1d8c1ad3e5c7d57792e7646291f33a69166835deb7ef68f4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e816262a03eb9cac586437cd15fed89ac0007295 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dcce2964fc3458abe9af858c4dacb0f179ce6ccc62eab1053bcb666b608d74d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fca5d0e292784c213a4c3f0165a9b9e8fda67bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e596e55c387ec2e9d1a1d5b29b44973cbe51ec4b7e01d69515596630d2991e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..90177e0391b1b3ec8ff24a4cd1feea1176bbeb49 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d833bea69bb59e907209d0dc0c6f23f4df89f13d60ac86a120c86a26078f99 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14ee2dd0d91c30d8dfc11c07c6e7378863dd60c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:341759bd9ac05a77253e538974f60694af8ebb1606de9bdcfc164969640c5716 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b92fb67cc05e1b5bd6f2537c867c903bbe1b5639 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80ba230e2069e2a88ed8fe4ba60a70fad9c706192d4b2fad1d836ca46a3d8f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a050e35a57b06e34e5f05f2da68120d70d30191 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4134e144393c84fd07870dc46acf0a7ed75733e8446fa21424db8405a2547b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..668bcca0d3e5bea4d3ce814bb53b1ae77667e8e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e89ed81e94ac05b016cfa14ec947e210f53388e459f70e26f1cfad648a63ab1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71982ad22854bcc54e59047e8ad501f36b644f19 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b583081537e9f603d3d6a1f36f35d16035775724d8dedc9bfe588b110a47309c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1488cbfc1a13391f299eecd5afe8bf8dbcf64e79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c206c87bfb3de1a9a8da1c8e596505fd4cd144f4d75391fa6349d746a6a28af5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b44395992674281258f985734f17d215918430a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d258f0954271dcc0ee053b758405c2df0de0d2d79901f76833b31045d6844b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..af9e224bb1d7a2aaed2249dcde856ca9f5c817f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10b80b3710fa3e2c447f08674b2e2946488d12babf3192126dd113bd60d9a93a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e6814e3718061268cb997026d8b25bec07f32fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f248b8a3fe7ef1742ac96d661be49455c52a7282fbd628ca9c2a58f551be666 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f84532201dd904eb402740e1081c8e0cdd505eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86ffa445fb69061be3c7f7b88e7fbfa80ae28db3965a32e377fb8ab2663bf827 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1812c88bdefc74a2d88977c010d29a82c7daa06c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64db6de20dd34805085da84f1a7751d08c30e82cc4c9b5675655bfc183a581a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d989a471eb4a2a74a4ba3237b97e3c7d241451a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3424a451bf7ef059180c253295a753830e4b3c1c3ebd886b00488d1fe1ffe710 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b2ff47203d6b7ca1ae341cb7cb40ca27acd43ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92876be546fdef80c568182ec2e55d6be2d35acb5be8ef3a1f5c30cb9bed9832 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bba32c92df7a20ea7ea7a87025f4119ab352fad8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65f7fff3adab788f7ccb15915208ee64dec778a8d6e4c0ae9069c3ba6465335b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2abb8c062c61886c1e2649a8bf4474e804ea31d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5c8d071bb4f57251e63e4d5e8c9964088d9eb2fae3a6965c46cb1560287e41 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0578d5075c87f87ab27bf28a3f44f44958b6f249 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6565b4145765c16570ce56bc59f0cd821f20f48a7c5f57b97fcefa8cfaf9aff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7a9cbae9883baac53c18d1c7f86f69a6b6f5da0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:746f680cdc6652b39fe86205a49b5e22c268d9c645c056842c4c7fcb9026d273 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccbfa0be689432836043b4e8f04b11e21c244432 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e03c98e540529807ed12e2b2ed75f543515d9643123ff4a8f870dd1d1ee09122 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d85f7690f3d4a481356e7c946f46d3d5cdd1b242 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34ea787e93dc37ef95b922b77ba4ea131788b979588e829f4c6b886f0a95045c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad3f5224b70f746c3b2871d08e15a572f33dc409 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8329531a2192c20417420c9c05bc0616efd89f05d50d7e58bff08162e30a0d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df998d01558486b9500e3d3ebf7bad7490503a52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51470f3a7f0db0f456f77a49499388496dc7bb5b337aad57b6e7bc7b452235e9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db53a56c2598360bf67f09a7386e38c2aea6a542 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3d6eb4e1d8cf401cc1899be03ce3fe904a584240eec5f857fafa6fa5a36ac6e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..084a3a8e16c6246a058ffcd484cbfc87340287d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19303f9bdcc5a09a82ffe7fe73cdeca7abe88077e9df1569abc10c4c5a6f7994 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c80502adfd5160d502448b44768c2eaea0e16a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fddb8e61cd794870f28409bffdc1656da230bd8a9396ccaed8d22ed8608b19 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c58fcf8b1963888edf7a3e7e535f2e680e95822 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1e984f8e244733eba265f40fdb0f2ffa187f8d93db948b8f9181b606f37372b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d5b41cc4e0c125f8e17ca4d4d9e48575507618d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a7040a592c53b8d663a1566a5e025636a77e2b1cd69aa46fddfe82df498efd7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02bd8c0650dfcf3f9e25ce15ca2f90a3603ebadd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:913a59b8d0e518bddb8225bc57e063fffa4e5d76a93141f1aee1e10e9a79bcca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c96f2b866f803bc52e478ddc99a8579db04d77e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7e28ff658a4f0f3be13356fbec0654c230819f94c29864dd0a1f46da44fa42 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0965b6c7e4f401285a283f49ba023902c10a52ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac6b82fb11d12b9d4696670e07748dc71f8a623a5edebed5437c7f53fe8ba4dd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d37fcfd1fee604c55fbf8734035678eadc796ea5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1d97720ed4d6fd18f0fb116898f1c21448d885cdd2afcfb25de5925494e5a44 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4956b497a846436e4484916a2d319b09a5a50367 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7f397524c28e6a09e3899954b3467a86fb3ee1dffdb5bf699a1300482935ef3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce33c1b8041842281c11e20a266e8a2f8a8f0df1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20b1f2c3ff4727dc8b69a0fa8f198c9e7ed4023c28d92f14444bc936268f99d3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4419822ea192b407e70a881de938093d26910ca8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e86b4fe7e53a4339e5852aef5d300dec24e7752bf824842a9a5e63b359f569df +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68565e9f975b094d7a7d0677c357529178c571e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e21bf87a95613437c41863db169693faa1f13ca895fa81967b30c609a3ae9857 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2a1383276b65edbfdc3cd74014279b9c8e55335 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928905773c1e29656e3433a90bed605032f9f972594139cc852e9cd089a939d7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16491481741cdd624c54de60f68a797016d15ff8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4188cc9b81d6a5e6cbd6c430a592efa57e6aa3d23125d4bdbaeb1202c1cab51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e46b23a922029426bd97838b2d2160c9679a52ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fc9e6f5154c866ed789f78ddd6e3059646c38f811d6d3004a787244da8db418 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e2a777692541d42a0c5a08e3cd0157f0ef26a17 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73f92cbdc6d070ce82dd23f0798fdf0a0e1f75bd99febbcd79bf9552e6424d83 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8065fb239f181edc0a0a96cc62c1e9ac4d2b28c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac779712c3e4391f530232dd53c3d0ad8e6dc1d6806e16bf651c76c09e65254 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2901946680020cc9594428f6a9cce546525ac6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23aff22ecf631c66576bd8a40d680934a1976cc9ea3631fd91c7fd715efe73a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f640f0673cc235a6972e80adb6703cc61e757721 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59630b8af0fdb812d777121a841223c46d7d55f1b048cfbacf67f52f0fc13a61 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fb88752407a020354d28657e39e4b227166d91f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8f58072925716a0809b34179e32c5df37494895a0fc470a538884de89b33629 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f1f57cb4301ebb7d672a3a16672eeec8ce0bd55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44eaec8082426f509d626f7bfc086a59f001718c0ea55721362765ca3637986 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98035f5a0a7f345bd0d08229fb230cd390fdd83c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7836b7e41f87a9a2cf967ccf3e4fbb4c345412165bf5993f7e5c6abaf741ef3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4accc2526270ea79891f0a913ea21f5c8ae0f29 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5fc481204126b049ff023a28f00843b188865f2e0d449d89894f9463c72a9d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b51c69fac89b062368dcecbc0ef0100ee07ece5b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a3ebb4ffee92dfb79008672cbc451246c9a0d8e4e7d1586acd175d3f5c221cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d395ed126b796aa08f23defc5b72484098e5446f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aea65f2a98be1107d262af6943b108d13a0bc369c503f9a8e36354649391e4af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96efab3c2116071726f497d6ef7a0263a0868cc7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c6fc4dea345018486c46fc97f8e1504d3cf9cffd53960989a003747b84b511d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dece0b35887cc3b3c8f82fe564d96c1a29808e6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a9c0fcaacde44263b76519fd9893d4d0195f9f2f85be5dd6b934865363a3582 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8316e38544eb7befcea0048b9f03e3786cfb8797 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca9de7bb1265a2fbe47f0789809a21edd1802a1ccc38a673e64b3c030f3f602a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5638f2d1433451fcbdb7d33b3c5eb16677758d44 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d3d19f19f6683e858e71e6399e1b58f200222ea60f12ba3c83f0d0f9675fe92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4932db5e76ca0a21b9809c4357379e19aa7eb785 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74a7bbd657135b5bf265bf82b97a22729976c1e050933f5ace8acb8aaea86f5e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae7119c27d4555fa06576c02c7bf643023f68a8a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:598576cb8899ec90773b502866aa4fc13c45e9f0be96b366906b5ebdbf32790b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c7566baecedb27e5b34ec6aa16979cc60642356 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5780199cd25b03a6012484a5bef999f6f23cb218b97649c043896196284b6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fa2b6cf2e6c97bba30c73d79f491313f94c912d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51850fabbabc193192a229fa048ff8e6224f43e79df4be5f91ef699c84334e62 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86803bdc09ce5f3eb76f7ab4fed8cc5c2ef46647 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:667acccf4c5d10975b205fb83cd7722ef5e90de64e314223e099dfd6dc5f5562 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9465557cdde4a6ae6cd6bcda793093295b7d7011 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9fdd3da07a1357ff29f514637af3382b588878971c70bc4a2dd4ca932aec5ef +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0afb1f06f15f6d52276a264826a4ca99a3b774cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29e727b6c600efb1209692a414395d37af36bec1d2eba585c4776d023f802604 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9d2a87d3c74d0610679cb07307dcbc2f9ae9ab0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b4a689a03d175fc3f1c446256b2567fbf5b699296ab55e5fbdc9b51bd18819e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c810a2d9e168c893c6af663a5847ef8c90fde5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b2855d094104ba38ff6223941f32c47228888aef5a618bc11ba1133079912e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e2a47d52b46b3191e24978f15cb1dbaaf4c4642 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e5b4cd2644b7eb630a7a79d4186fe4f56479ef07d0e595b8eda96f44967472 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3284f770d7a81a39b5e127b26325cc8831704a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7604193dfeec0c3c1b2dd06eff1320388bc786ba5f00c6d3c9aca7366973d68f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..052ec6ecf054c8c5b4c313b71a36f6e59e5f1c1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce4bfa6e95ced39a132fcdd2148bacf0ad7b29799dab4eb274494723e1c0aeea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..507c4aad3445cdc04e809c2e5dd2575f180e6070 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fefa1d5ecb9f2f1276e401ce75b4ed642d9da0585a096038c0e45e454142a46 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aab7a9fdb48ee270e46a6cb40b646b0309ae46c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5aec63d954c9b91e5430f6c027aa323a6e62ef9fd44501beeae3d0514cc1645 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc20c5015196df5591c649bc2b7b09c811e580d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f955721ed856bb95454f4951dfca8fc78078027239680007c11eaa5bc0c66b16 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab127fa09ec939756ee12a30e2a25c7539c905c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ddaa043a116ad1e78ca5ff504c645443fd7fbaac024ecebcaa39b043749a7e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e7cc3df7add9a80077d305de9841fbde4b952f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ab1b947539c2e8244cf3063f21d3e1130076ceb827c8f48749e82657909f0e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5926966f373031f66bc0f3f60ba09ef43da6588 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9256d9aec002e2609bda64e1fdba0424268279d0e515625b737e826054a542d9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..336e86af3fa1d6111c95192389968fe9a97a0828 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b51ff16325cd3556dffedf03c7f32268e22845467a48425adfb6edd477868d77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..196d29e1ae5645c858f48fdb89a7159df62ee076 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cba1953f2693837071ad5695579e33d7c64456fb889a4dfda37b234eb3769d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b10f03befd079d07d8049a10b451aa2ccc076aea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd6f0e2c408afb55e292fedd2733de1722bf7ea47468f81e6cf9b9a0475f71d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d4f48bb68f0411f28f8d4589ceadd68153339e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8a55a22da4ffb39a94715108f6dbbfcbb9c5c872dbb3b7b0814430bae56cddc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6554f25b63def2062adaf9d4a51aca18be5f80d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e67646ff8ca9699bc561ce8a29ce5f6aa8ae41d612991adf248b0b527109d916 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..249d4f1dda374a6e1dcfa870b15e30adef230e62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a5065d31771bdc8617d8487299172dd920087b50ffc9c4a166f5b6239b87f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..09b0b1d81cf7785a03f398c33f2ff8f77b692f20 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2440ce34f25a1d04b85e80ed48e0af272c340c2b96108829c957ed97077f3756 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b506030df902a9ed1445fecc0e02bc80ad340c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab139412324d25984eb541884a3fa95efe2801eba7edd69fc42d48f77aaebceb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ca7669cc2762cff8b2a87b6d45c62a3efe01f1c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d62fac78f94f5a697af8a9f3e629e9ab02f0e374f283d7113a732da861f8fd3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5775b4a893c380b77461f673ae848f607597cfc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d42577384312b9d09f9085669658b8aad7202ae7bdc47e960c4d20f55745e1f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..406e1b5d8113f4e00957b81fdb2f5ece762bd301 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07036a3b038d4800a1b92b85b55fcb176eeb9e548798342d33fd67c881bd8c4e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..993efb7b7b8865a34a4216f54bcbe74a70599734 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b9932131ec1f2cbf68107a46a9d16b4be91ebeb91587782d30d27f5e7b65f9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd374426376887bc24ba95ff8f09f9349a04240f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df4cc00b27894da7bb1b2dbf119c3f93e54a198549b60ac8259100798c943550 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0836745b29ef019cd8b54045d690560536411165 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21c6d0136a6992ebb7c897972ca20902294b8420e97e039a1467d86e3a95d8c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeaead31fdaae77ecde9f9e978ed2f06d6f67645 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba3cbf8764c47cb817c0865499307fa91ca0175ec68261bdf07f3901f0dd9fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b9dc29d0c8d83c68a92bc46d49db69dcd165b19 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b5bda06acfcc58f2bf9a3e64a32eb9db7d7cdbc476606df344e2f5608688d71 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d5f544d33464abd4c355f0a8c4e91dbdb616101 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:462a01b14d6ac8d992d7fedb18202286aeedf6ed1c53f583b378131693ac42b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c7a077a23c3fbf69d1e9ca1d4cfbb080908c5e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff61009f556e6c1710d65928c5a891a18bc898c90a362a6dfd9f175e6065e4e8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65fbbf65bff6da890a5397f70df4feabec6df269 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:207f0534552443f21e5c92c790d2a6dc3369053296611c79d69eafbbe8d491cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca4336611152ce0a7077f551c98456a2859c278c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cb908ff9efdb35daa68bc5513d8bca09f4902c324fc14867187f5b963de01f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91bf1268e5b0cfc219840b371d09669921cc8f9e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71fc8ed9de3a6d582370b66dff3e718e50fd226d363ecbed09b1292ca19f023 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..940cda2395f072cf0e963e588a8fc27a239739d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88c9293f8ce441d852f5f4611951cbbcd2e830670b84f605c7d238453ebc396a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..200453ba53dfc9a306044244661a4881afe12604 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409192c2e6de694704faba2e3aeb4fd9d26ecc59e0ced29f7ac7d2b4c0df8bb1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51899a410257821db4e3df362ef9c8f11826991d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:229f5fd22f5642236a8035a90423e9c11fef86c815991a0cbaa68ddeb7bd5a24 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f8bfbeedfed441853147ad06c09dd6ab0a7a865 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a30aa5f986d18d2913d4b526ac2bbb555b6acc77f9512132303748319f3ccbf0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fcc3549e8c932564becf6700fb157ed83610dfe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3833878c88db6765adbe91d071af02ffbad653c02f1c92317e6c6780464c9a94 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..383fb367743238171d8535f225338015b9cd5726 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b39c02e7fa847931aa849fefe01074df5bc181d4018f0576dbfa9a9ea29354b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e5037fc15cccf0e6c16790ee899bcb1cd76da92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f83c24a6ad9cda3e6dd79ff5e832dcec20c0b8e21c02746b8223add0bcb12f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a5ce2071e43ba460a07356e6693dd050e23889c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b45110bd50ff31bafbe74b6fc8d51b370d696ec2c3b9d21aae4c1813af733384 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..022c40591a3da059a3699509c85febeab7b92b4d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c84197ba6ce1ab797f3c0216f30d103fcbb8e9d753f4e7a146bda195bf318e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb99c45720dec6bdd13af9be78df512f438d3397 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4316249265d786d3c7872b96b70dc9d68097c62ebbc9a11f80a0bad47099d88e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13c38cfdb27bf0064ad38e98e250618659f274ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a067239265119049cdc247aa115626f4f7031d2d27ba473927ef461dae1254b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9769c3967930fb279a453f81990b50e8c15990b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d8b71af9aa83ba312bf1ce26d2d0a8e6c7307fd8ce59902f05a26b7ff25a2a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf21ef4f73f0f94d8765baf90f7810cb0a7989d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a101a46d5e6ad0cd1b1ce9115270fe6cdbf0442af2bb367d314acf54e80d433a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..83886b39e79d7272ba71963a29f98953da34aed6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0654fbaa73c882ac1d16f3dfbf0167b53a959efabfee529e9f5ea56b7559ca1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb03cf237efe1fd4d102eb8f1701691c5c4a01e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dea0217ba5c659f15a517b0b68319cee1f0c8fb5c02bbf83400eabde0a7b885 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..706bb69aac1a1f7080884a313dfb84f0204f9d42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac13e6cfb5c23cf33cd1a7352fde6fd703549d6f8790bc008392c362c8de1a3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d46f5d05eda374c0b242d712d9544d8ae30eae45 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cfb50b34c1d3e728a4a765c79af07a421c61b2c076cc04324971bea3060cd9e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ef719f8f2c775fefb58a39dfe91d8c3ade2e461 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7651ae3a05de534ba612819a4aa03f0e857ae94eb04280bfa6194a32348577 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..719e737c4b2994535287ed6c0e8efa37504897e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da5f4ef22c601b3bf5327d97773fdb3ce84e213d5a39633760c9c0cd8390ac9e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebf8dcfecf7a2e5aed0bfd9186a218b43b07a6b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93bc612c863b86c6571aef63a01957a88181e562df4a8e741d5001e3dd46d765 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74298e1b76b3a0f6c6284507b326d65a51a8223e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f152ced606bc894eaa846f4c7cb1255790b8b4056a7a8a3966285cc4bb772172 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..56ad0ab6a7b4e8791e80af3ceffa80f5570fa0fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a4624e520666a11de6c137f4b677fd5b06f488cf856ef658398a3a2ace80fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e687d0ab398d0d3d0fde3a0cbe4f32658c91aaf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d3ab4452800af6d2c353e752c10e61fcbcaa2a034f3f9040e06810ecf8a1231 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc33bcafcf1d9c9081686264816de9f315c6b3e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6e18116e9be9841a0b31da02608dbfa69e88c3d031d47f3f48d01ce5b22092f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb83676f81af12ccfbd6c89ad67228db21495f6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ad057b9d492ca4819189633b34fdd4b757b5aa574d5637051038157dc0e318a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1999af221f7f1191fc67134c456aa52df295c180 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdf8fb8ab128142fdfcbdfff2dc49db9dc8704658a286b9fd56f68c70f61f158 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a44a6fc33deafcd5aebb24ef90cb6aebb54f7fe9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d5b59a411da999dc191c3f731f2b801f2c2b1f07035a5de221acaa099c50b1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fef11b9a9bb24fabd31d657d17fd1dc60d61c5b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6cab86ab0423690d20834c0b07ac6a635a956b005e89f32c7d694c8a060cee5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c8300e269bc039aeeed87476ba0fcdf6484fffa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c50dfe71706558ad45083437f23913f284de8801c2ff490693734a5465c469 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b69047b7233cfa2308d2c2b8658a57bf3f942e05 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af3dba99406bb4d252f40217301e41df5d944e34a4e850da5db336c7e6adf264 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b11182cb5e62b3ff8da0c14038e96d157b577ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09aab65519259585f5f89e3574f42c039db42ee715558758528fba502f6f7589 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aee7e10b49c9f02ed921c6509512c6e93bad8c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a10b6a030c356bdb7c5e69d661f278bc3a970c3b94887ab936ed9ba788226af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..633da4799a6fd14f3f72485f2fd208acb923facc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:479f954437efe88db3398661ffbfb7911b37cde8174592bb6116114ca7203eaf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6e3cc5ef08ed4a7d63ef1e20607933c3acbca36 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faff35723bd2a43e5ff9c66bd19a0d8ef2b22cb1e94200c6bf2b79497faf3b4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bbbf17027dae711ad15efaab00d246106bc0cbd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56f126bd9dff1498488c5d1af44913e5e7fa5bf4a9d88421e1918347ce9f7395 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04ebefe88ebeb1c838da13bd76e38b436104d185 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8bb8cd25a085d084e06b2d73c333252c888a9fc53711be17e16d7654de6d59a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..422ef2a462f6398d673d009ebfb21abeb89bf9e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75789f94fa253340f3220c87747018672762b0686aaba18551bd84c834f7da7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f77f1f67f07c338dd7b5ca182fd97e9bba6656 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:735088aea0c75f142b9ebde041609b955dbb0c7077b7003560af6813e8a40ad4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc6ce9419394e6f039539231d2d03656439c2e8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccee9bc1c9fd41e6c914bce6279dc2da4b38012b830b44cb6a016f8c828755ec +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27e1330f503d00d4a83659c329b51ed6c119d6b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169bc2f0515c3ed68b7977b9d6b604d3fbfe0c346860654c132ca76e7898a370 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8ca13fcd5113373e82cfb8260af9a940102f938 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8193390d13f4b74ebf0976009253154bfd2387688c3b80b8937f650cb028f73 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a40d734660ee5040b4878a360b4d80981e6e4c6e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3733a3d6b0fc8c8d4b57d2836fb14fc6e330f2ac7961839affbc311399e9c79b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93b7e6fa8462d78e19395f1101c3961dc78ea9bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23462e3c31b419d46b31307735a78d3ec9898ea2e2d8cc6d91e363c8b8f97c3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..640f6f86b8a9fd66b57bd57a6172d486993dbeac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b238091a0593ba54df7994137fd31702f418eae888850f96dafaeda534806e3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec4ca5f8082050dd64892e90d24bee60bc092fc6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f91804ff7d9166dbe9f9ee6e34f0606b9b2e1f927473097c3c843578756d8bbf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b32eec24c99b605b0c578464b1f388dba42c9aa2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4da639cc3424340ee785ace378ba8bb66a96d2b6a3725fe40caf7c1e297d3685 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..433d89f8c32bd1c5323e88572affb0d5f55c9e23 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd7496b3d137fc861453d24176f61a2b173092ae211108f016c5b8ab4222bdf8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a117a508cef2c962a0ef515614018f0fcf6d2435 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1341bada428117a34e40843261ab167fdc2c62ce0a80b09e92aa4d01803a8d0f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e7c15800ec25749fde5836e31d8790804ca808e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a899dff9bbfa7b887090a44ad14cb894a48c6ec2e97beaa496de64a93b4c40bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3efbd3c89312ff4859b4d164b81c24c5978355a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4fd1d11be0119c5f86f3905f2ed2882826f6e40fbdb9fe5af4a87132f3a942 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6313f4150ed09b9f424e68e1edaceac4310b1c10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c348953f5b48b801b56cffcad4e2922f534f8c43a8369125f90d5f7c6285f9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b382520935c964be5d1d65c99a8413f8e346926 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9772dddf1258d930ab4cdf28a2e053b15a93718a91ae026f0310eabe52a6c3f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a12aed705214c04677b5eca6d534b92f50757d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb58a34518f791bcde67ec718cdcef2bec75725984d0a7020d0f43c2f93cece7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b6fb926cedddeb55d81ef2563054e52d4b282c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d532169e2a25c9dd3f8e4ef56889006936cca5ad1f16c124a73a296c1149048 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee080902211894ef2d2c774481907365f0b75afe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08222075d2e20c0277832e329d8f1b32dcfc3bf4db036ed6b532fc4eb27b9194 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..efba03bc4a8cb1e78a24c37ad5afcd2161f5640c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c5371350620599582da6e04e3e5e4f626c6d180a8662c50fb07e032e393c1ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb50efdf15fff26db17d2b433e201841ea85a3f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4366a41c43955b3ca762e44896615a8bf8dcc6ef218be99b1eb7e87791d7d1b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f978b0169a60d64b144fd6fc793e0d89c8898e9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c3822b5a407236a0fd07b8e9d68527fed7b8fea49682b8f9bf3c3fe4710a581 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a823897fc1cc8498782400775114dc872a09d2e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09c1da897a2ed747f78d80e0ebe8aea41d558ba1a96d2798e450667a4202f667 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d6ec1f14044fce9319b5ab8d78662e0a390cad1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:078d9a38432807e7a572b3399fd3dd6c33e29b87901c4486e4e692d1060eb900 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db88d79f7662cc9a5b7c3b107f85644ce550cdc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e1076bdc14e44b42be542ae5fa61d3de8a7f80ece9318e465f26382eaaae8e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..172aa7695f92e55e6047a1cc1cc71a3a5a036d8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bab91036d0506b1c9f36a84bf6185d319101b0536410148edbbb23d678875954 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..668a919c1044c2c8c0986183837ee35d97529931 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e13bd0bcd199e3e78a4409cee8c9e81c364b003af36eebd810020107c5beb8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ed167279511a28c599587981e7e0ab75620ed05 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8705df510e418214e23d3436ca3f9d4fb72e3f66bf8421bb292a2cb087c7a58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c724685a1cf3a343715703ec32d6425074e427f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c7212af9521a989633b086f78be90b343df5ce7472610bd23edb7b7e6bdfd0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c87f1468f88c92b06ca2a3eb248cd9141e39ea4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a81fa82e63242d470e0c319bb583a41676b73bd1379d67dfb32ec7706e3360b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e17f612ba5f57e2ace1b89859ab31af967d2121d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:975f521677d04bc3a618d0453f67aaec4bbcb26c8f9c3c2a2ae57319669a3ccb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..317ecf5d3307b11f4fafe39b8bfaf86fde0c2853 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14dabe647664963d552f4676102890ba451aa2944319e325b4d513119f57074b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a5765405f5282d3f2e9e3b6f331b640ab20b6d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29582ae22add7f10aa108594d942e1d95f948b25a6e9593c95178cde40e464f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e551e5a027f074cfafbe4264b0d31399b62cd25d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6ae579e8f023a50580996bb2deb4432726b0b0f4adf5868f28b04553c3da344 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7cc5b1f8e33874d2ac3fd20d27862b42d0aa3ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790a641fc8526a91625ebc9ae1472de18e3954b281cbe0f9e836e5f7597b3bc9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..840d240156c6f0691110d6c0013b0f87437abc18 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03f6eb39a0d75a9cf6c9164e8f5036655f477fd48c4e3d7e047e8508e64e8d82 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e77e88c07cf06196a04e159529e7455a894039e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:292e900c13839493a9367173e74ac9c61782f39338f14638e4a788e4be94df90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a49b8720edfc06530537ee4f423773758cc1d6de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e003feb6fd5c6ff414aa9945fe0ad9d5dff962ea4a2e25bc8f0a80845df9f32 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0825a52a4c8f2d3f128955cc49e378bbd8048c21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b57157700f728675f731662ca1a240bb511a83424c9652af0408b5ec946e0409 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37bd5090617e7137048e02e648bb8b544b875b3d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ce70bfec5c35577dbbc45e5d5f1ec59aa5aef18d8389be43435c7008dcfd83d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba4ede2c6d2a1695fd80f5f48d322c9bced3cdc4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:445188d0904f8919ca822712cc4920da2ab8e7aba658f901ab53bc5bc38e0ed0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..82588ec7e33984a6e814ca04f24b3df584551d92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0dcf2b82615aad41724a3ea468ed073b4d2f08e3b26e3e164ac85587bb575f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e67558f07e4ff794f944ca35743820e635714290 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a26922645c54d9706cadea08e7db9a6a8b3345098e59f925c97ff483740f2c1a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48580e1d554906de90beeb759fcf15f22ca5d77d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80a03f62aef87b00746ea74255cd95d3b47a6acb38e04346cf3846e7079076c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06409787d2bdb0b353c60d3446520b82da3ed9c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c35249906966463679762d01ca02b05ba3d575689f3eb1d2d9d62a89d30cdef1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b80ab772e015106fe19ae139306fae71d5483512 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d81437e1e8f1eebaf478dbf1fe19610ce4fd03d83c7cd4823478c66c81e76da2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33f326c808e9f35070a600c8ecf8b400aabdd7b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4149917eb5c8e470be1144dfaf64583aad00e1c584ff5dd76f73160b351e89bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e493ecdc46ed2c476e5725b0c7575f4360a8a80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca304f987c1b8e8772d0e7afc53a4d711b5c41f9fba75b45531888b7122cda8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a24ea07774258195a7ad8f1d7cff84eb778e4ea2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c39bbeb8aa8c496979ef9f84cb839e7db93ba1a2c9cd98e570d0d0a4552a4a9c +size 11395