Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/4/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/4/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8d7e63717180534c58f1df9b06381cfd3ca80b9dfb68e61b777f2496c1711dd
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a0066f0ac3b9f53d5ca3a5d410c9c313cc9b99bd189385b6517994d15597cfa
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:811f616b83a030601ef6c897941c12b991d4970a5b9964a6befd5e44a8ba3203
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd4f4238ba4fa01e22963f4e99a81d245dc99975ce01120e05238721ee29aa0e
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a056ce7a4057b204f46eec7578f88c7a498e42928bf78e3778a324f237dc6e4
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5510f9e6a5677fc3e3dbe161edcb7ee668e64d289ae1dd524c45287d0c53e531
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd1f0eaf1088c269df861f427722d35a799d190c836eb9c670c114b0f08edb12
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23070b0d0b8b02db19317489e21df32a02ee497b1e224b06f2b11e42a00e44d6
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e220ba6a1c42784291442ce032e5c6822eff7227a058d91f7c100eec2594374b
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbf022de901598164301274865e0373e1f65350c3552ec08e20647183d894d70
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c47934c05b7e58b7ccd278ef0fb06f4094a3c8cd86911c2322b5f57e494a6cd4
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a56fa8317a7c9196205fe45918f7a8b5a8c01d32f4e828d1a9dfe624eb5aef81
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a8bd91f3e3da727bb4a1e83a3ac61713253245f98c6f2c1b9b667d6aa6983f3
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0eca24cb0e0f4cb408ba4aed3e9a69e141a4f9f12a5520e751b5edb0278d80f
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2ff3778de4ee3d7c5edbb639be7686fd1ef104d9bd8191a3d378abfa571a1e4
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f542a58c128745ab6b230ea8a2cb0a1b04f2553fef5513e386b3250fbc9e6f7
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76565d316ff44f1c2c36752e1f8b7af0eb1c39ed557fa5afa0ec33fafd9583d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6390ce0b9a142b291eeb4a4718eafcc80cd37ba9caff4577eadc480b0e4c916
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5633316c7006f68e3ba369e2bd08717f55a7e0a14970ee8b74297a4ed8454ca2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54d883e65b80cd900647773fe80c12ec3254491767fd2497a7c17052e698e3ab
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:276955c1a76d405a5844ba352b60a3a8ad591490df4bb1fccdd339d9ccb3ea9a
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b0631ddbc8975bd307a295b9a96c1a09a71c1e76c66cef055839ff396cc013d
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91c5acea14c1c2979fbc5d69688a7bb55b7dcb0fe1bfbe97ce5a02e7aa75159e
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba1aa037144ee28b062c5c33e684403d7c5d7cbeef26956dabecc2740dd45916
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7db024be318696d08e6e56e0a1b6bd3e126b0c69d3b621b12317b45307cec9d
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3227b5ed040f6ae9beccfeb7c732d40a5c09e06a35ef64bd048b099b4af0d4e6
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1196d00b93a7f33666d98a04894303df8f967d5c0d8567f5211756067915d259
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c93edcd55ec26752967d6fcf5d45bc1f12414077157d62858593b7c298867886
|
3 |
+
size 11395
|