Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/4/rnd_search_t_no_sched/comb_13/init/lm_head/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/lm_head/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/4/rnd_search_t_no_sched/comb_13/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ce3b002eaf000c66ae3145b821bdd6a4b7af085210e55826833727d85659bfa
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5f6bed76c35690b07f17c167360bf3cd5cfde1da0c617435b8e80d2c0e424c9
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b448d5ed6a23c25ec11ad89558970c6f50d2f891f2d66d9de4b8225b0de828d
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46ed81b1a227b1aabfdffabed3206a05784226b1063b3b34bdd9ef63fa958aaa
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f25c30521a7642d6adda9cda68a781695da1189295a21c875cb4a8c94988ba3a
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bee212642bbe6f35f8a32871dd6bb3905a4977cf08e4e2ea4bed417202bd8bbf
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0167fdb8df4f24f0190bbf41d93d0579be3862507b25538f3d2d2faa33e39249
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:226a8c869aea5a40f52e8b64b8daa762f80fe9929b60e5af8d22acd91fd5a626
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab79fe35179faa043842a5958bb97bda8f9fd8a569c87404b88ba584e735a217
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc6337a5cf1c32fa0368dec0a29f3c820c690d002873099caed4343498390fa3
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed2b03685a0ea66ecbb02e503b42ae60a913bbf446cb1c68b70a2d25cbca3b85
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:defb0328ce5bfbf8f4ebc071768d057cf32ceed4b1a54c569d5d7553e18e586f
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:272ace44f903b3e3bc6bec1e35a18f831207b6b8f04a424c8224ac5deb36df75
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc2c69ac87ef4c1033d079c74ca7c6b3f79183aad14d1e6a666d774f89141124
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87224bcc9a640b3c08108e1c96867ce95320ed305700117f671801f750df71be
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a6cf979f3837069290a8974649930063279b70d183f0de38989b9729252a740
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1dea5dcba16b872d36670798f19275dfa58f89b69e72f3e7a418eabdd6bdfb5
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41eacb42fe6fd3a6e2e892053af537dd3c7cbc7c9a4a4ed9761e0c126c8a3031
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbfee50cc30356ed11b7316ab29a2087f06e137f8b3248a8dab0e6c2bb3c99fb
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42585a82d4fe7f501ac0b6a94e0fd06ee836b14919e5a8f8906c54c44fa4045b
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f84995454b212c90523605ec53a3aac0ed86501c371f10d115db9a310804c5d4
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93c3e2babbe240a14398f91eb5136840227d6c27c7521d5c46b49e62855b9b65
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2470e9337da32e12b84a7e82ffdf4ab61bb65427e652c0d84e15934cc61c939
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4887967ee8a2aa484ebab22c2c19fbcffeb81be6816f9d29de62b91fdf58a1e3
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:628414013086f87eabbdac1cf7750f739171546136dd7c899b255da64408f969
|
3 |
+
size 11395
|