Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/8/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/8/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10ee53abb27a2ece42f027fcbe86fac973f86a0212225dc0fbadb18b7caabb82
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f9acebd16d2e1a455d56883d03d0580245d76cb7945f0af48c2b6781173e447
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba73af99613bf3b6b5279688869dcf1a36ffdf04b486d8e8f279884043fad140
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da8526f7b4237684b523a6da5f731c6ba7984f6e1227ec6e4bb3c1fbffd050aa
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df1231b4d1eb09c7d5893940bc34e7878591ca8aa6e358b63e4e85ba02b525e6
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9baa93e2598360d51d4f61907c03fcca86f92675feef43fcadb6847e5592b36c
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc0b5205ae9ab01c599b93a63bec73ce61a8884df01f566259c9dfa7cb82c48f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42fda4c880b477014b1c320920da812818e2f7f6a9effccbe30f7b928bed59ba
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24871f8b42ac7f5ae74aa8879066cf0ffcc52c1dc3de051e94e9d46f1e6fe5b6
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebba9812b20e36dea3895d2bca4268ab423f671e70873e0063e19d5b2e0a1fe6
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cabcc04ae325744f5aef58db94913fb0d1cc4374acd19dfc2f610848cbbc37fa
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e439de20722865e3c4f7b26818a293486b70f1ff0ad6d6a055ee84237ba06508
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad5af192dcdb31bf53b9e690b0a2686921be93fe4bcbaad5abe8619db0c9e338
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0efb4607fc3b423285fc0ce6df4f274847126860e24d12dab8babc76353976f
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b056bc316d24b6dfbda28bc6e0f58962a6a71a77c85bf3676c313657bae1c3e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:edf69ca6b8d52e7e1765f50a18c9e86e58c86b891489510dd9531441efecde0e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed80ad01dd16b6992c8597143770a7fe8ad8cf575e5a1528db38b1f139b911d3
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:040ee7ba864c9fd18a3d82d0975cb588b6927a88990bef069e31528df6b2b478
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:934c60016fb070c7b3bb8ad9aa46481679f79cd714bc065cfce2fb9cb705a78e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:840719bdd2f1042d6cfed57e500e4d3e6e47c9dfb2547562c730f0ed3e4b125c
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f9a00d35309374520fd054179c3bceb52f6960539fcb3c10b681caebe00a89d
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:082e28085935d38a82d47edd923af3843551d3f3c7fb4662c7b1016a4a491e72
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e3e5b37eb2b5eec1939c691a00cfea5ffd7d2f30f94d6b53b63576b3f9c3c6a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:943f814df676dd4925ceb881694201580f45be9572de47843d0313ed8d75c911
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f94049423ef07aac3f9c7a1cdb50a07e369c5859ce7d62ff5d662e5ba1619da
|
3 |
+
size 11395
|