Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a63d286686cef7e1a88219cb19f9019238d6b80fe317010ecfaea17b653511be
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:175063cffcd0fe3849bf8e0c30a95aefbf2004ec5e9d3b0b5ccab5a69c2123c4
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4abaf283c24b88d4a5bd1c856d0dcf1ae90a20d6a0389272196dd2fa9fc077e1
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8dea1bfa2b97fa8454b5f5056ae4511d1aee5ecc573d4f1c32ddfe1ffdcf098
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09b1c4932597015532f16d30b59376904f67fdb2a733b585b72ff1d24c44ed3e
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4f41bacb44dd2cc12c63ec81b4c3fb202a17625aafaffbadfe16d4bba759a0f
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27c189dc3a70501cfe33d08adb18ae3c940bbf4365ba9036eb0a7961e789bb11
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d06db3becaee64ce237d335d8275ba5bd5943af7c6d2bdb066b137ba2734d72
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d0ff9406289fbc46fb0d1fafb11c9f59a70e59ce1c406ba7e4c2edb1b31e803
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4c34def52b9d74a55b6a7ee209a923ccfa2b9acd4f64ffc82e8e1ef3f1e0110
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:828c11aeaa87617168d7f5d27b7fadf38061447215f3f20e6475aaddd2c7a01b
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6b3a1c017641958de8c7ba27de0163f4f7ded0d42881a58aaf8bbc6d615368c
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8128a89902ce98fbd0912798b7c39da2c55282948f1a8d7644947d23be1c00d
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:beb6bbed83b4eb7bd4e733fbcb241a41ff61483d91d2588bdb70a1e56428786c
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5abc67005a5a1b831938e9bb7eeb47523f5570d1a95d892b6da2f6c656f2b306
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db852d18abc43d31e59d9b81491e1b861cbba5c2561e1bd12d7e423e1e38e596
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df178fdf5e1f819ecb94eb4d7c42962793ef060a2da68c8b365dbc17f114ada2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1220e2ce344ec474651ebd6ea3d3f89a7ae957d25a00b3b71593f1cb9d366ce9
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:498290234d06cec336ee9d1d3bfc0b7c2cd1d60b8d4b6f4a234de76a7af32dfa
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52d52aa054ed98c970c82944694cc6381d9e19e8f92b39a9c1f91ce1b8565241
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2268137a0c09e1a6edde009b8ab13376b9a85afd9d47cf55469e4eaa530b8a00
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba26e06fe7b3941a2708ec1ac604877026c88e2bf581fada3c5978c22560f98e
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f01d070e594a6faa8b85195e9e7c97479a0249a27ec3fe747a682541eda3ebb
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38f96e425a7a89cb49faae2d1670643efedf4eaf371e3bb7214d58683cbdaced
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6dd986efc7ad61d1c9e8df7bff4b95507bdd205f826afdd69495932a82e5321
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5f452b5524db2b5bb608d4ad566076ce75925a8132372224b9fe4fd6e8f041d
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8822852342fb2a912ff50da0476020157b6ac8e8ccb15bb7ce88672f01704619
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89e0b4a39c31538b92729ed27ddcfcff4647c5b32ccddf9d8a971a4d46a964a2
|
3 |
+
size 11395
|