Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/7/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/7/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aeecceb0b4ecb840b2cc1b2b659eb37e3c2300723ceef642a44aa5a816fa957e
|
3 |
+
size 205955
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc079f36b6a96c357c9ea2fd4027b4ba59fe9b5e7e268e49820c59688bc14dba
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:068e4705776f11d24df522db7bdef67e9c1d9184668544d6ea7816e3144775bd
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f90cfeea5c7561b1d68e9d9d7636df799a1bfc20182b8f77f6119acc3c5bb4d8
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4f2a2336fa01a987be4e9534b4ebc239a385d7cab4677a6b7dc47746a72e36a
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95ce32065362fc511cb115003b25ea66508859592cefd0024bcead150393aa1d
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2061c0defbd69b909ccd861ff14da454c147d7e5b91ddcf6fae98c8f56e0f237
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:770ffcd09f101e0d0bcdabf48fc864cbfee46519f436caa05e1e0824990649c0
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db978715f7f7ff610e9638c9166d441389531cca442086b32afe8f4dce1689b2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc3f97972a26d93e5f59e0e6005d858e41cc712bb7bba711a5b75bcd3ec9a715
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16a10ae05b6be1160aec096e180d29a2891ae99de280ef533ed4259932e3a648
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77ad9c212ad0f123dd8c65454a778d94cc06db3533422df976009b8ac18dfb2b
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:851cbdc9ad40ae2cd6acb01ed8dff3722ec86370baffa5946309280292247e53
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbbad8918e764fd9d09e82e1d05899be7daabc180aa34163085262912fcee962
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dc926d1acc06214d011a3f21170a5bf76437946b41b07c892bfe80db030bcfa
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df6a0769b6f7623368166575574a60aed06981dac7ba56273ee08fe215f1ab7a
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f429acae8e9a91a4164f024ad8211a0efd94b1a06fa0471d43e1c149924c1e52
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:658ab64d2b9c93637a82cf67e76e60eb58b3e7223609fdf21091f99571b04752
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed8a7110c9d014c550032bdb4873913dc4130bc55e04a423efbef0ae04d67e3e
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9be5057b274f5f33f3b7be9a2a824333dbf1539ee07e51760f3dea9a131302b
|
3 |
+
size 42115
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:252b9ed80b31066c0c1626cf916bed78afeccf721a794171c935e41122327be2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48b3c6b16097dc76757eed9ff94a83a2b32fff1614933b2d70609494cebaa03b
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4162e296ed2422b834f812167c90b41809a620b1e650f857a4ab0524d8dc0ff0
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ce0b5b91411a3096bd60518ca0ac7667009a86f6c2e1d5c4326d5da36ec1182
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/7/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:477477c23827e2c285bb7a992b14d5cc6a8d5aeb6089f4c2bd522c16846ba338
|
3 |
+
size 11395
|