Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/5/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/5/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad5c9dbdf0072eb4c311d7d92096acc64cb132642f955dbf777ae002b86e10c9
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d5f9c1ba794bc4d06c4ff7e432b9472a0e2cb5451fcee6d8ae56faa7d455c92
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6169e9c81c81dc3586fb1d3641d837100d5e825908747e28ecc64678e71494ec
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad434170f970f24a8789729a3b4f454761de155c02f9f53a613897530d2e1572
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d181bddc3652dc16a47861425e9b9a18d412ee1e605ef43d61dfa463355536dd
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5499d6f6b7967ca86515e223b3142e0fa192ed3887051e353dba9199be78041b
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f052a53753f60e0bc1c7c9693b57344fede8bceaf87c31863644c488a8d1346
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:168b17fb2d1ae16455f99328b1e8668d0cdacf3999ce7ca3101dbd8e641dd3c1
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf2334e24c9a43547f7aa2d09e603d96fb8e5460c3355eb9fd5ae42558afa7a8
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31ed5410a63c392e276de6b3c321cc95d6b8b8dcba50dbfc0f96c531979f01eb
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:faedb37314377c61ba997a695a820d3370988bfd8c0c7a8467d38ef21b8f7c8a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:216bb38a61d3903d15654fd6c042cd87221acf915c9a57aa5831b71138a59988
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:431d1465bbbb5f056c15a12c39661264fa418bcc1dab47ad891d76d7459838d0
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e5ffec0c80b43e1401a883a80c6a67c3bfeee01a2ff44e5bdbc877c02b0839e
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2392ce77e7eabd126f39f6abc21a47e570e4577952a418726d2cf950db60cfb6
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b142289942ce2659e33bb0616ec4e098031c66690ef72a1fdd73db30f61be366
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f6f62545d5ec2d4fe5f15e5c041403731f38783b9a77e14eaeb5ebd478745aa
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30b59e804b34519a1ee348772b78128848d58719b8549ddddab66f9978ca4eaa
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ed003974cb3548b4d15b4ced939f6eb5330dd4e0e58bb8aa611aa74aeeb5cdc
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67b21675cda363f1c74f2d49bcaabe4572c2272cc2566d799e895443799ab837
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e1f7ab5d80f7da4d0456b6fa6e8931c46ea66b3618f4ece18dca167de9a7eed
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36972739db2922d48ee517a7fd6e27283fca0e6a99978dc8f55e36e7d8df1dd0
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4422a26e29198781b621f540dfafc8ee6c91fc9277469496e00998168e8685d3
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:840f922ac4613e526b11a7012ebacad64eb5958834342e292719f2810dea9eb1
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a20201c55f2a848fcfff203ba836d1f17db2a733c065f17526c9a1e7e0e13d81
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0584bca5d48ca966a4c76c799f281c0512bc36a16423fc9aba21f610ea9729d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a97852ec0005091d21f238644ebd6b391b268e8ad91be285653891b266a44d6
|
3 |
+
size 11395
|