Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/5/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/5/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40d9394d9235cd5769706d91057592735c3c8b60d50c810dc5fae009bd5f5ad0
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c95ab0a0fac0c3790663c379fc8b1f5d32433b709d315476fcce7e82673cff1d
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:105fcb8b0a461ba4bff2e28fe0cffc1b65864cf83b27c79cbd2a50031116f0b8
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45a85546214965257c8ff2dae25c2cb261a62a75314694427d46efd9bb87f00a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:487e892c67a68173956a5c7a0ad114a1190f8e1cbf163073c9dd02e8f4002f2e
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a96ab906858e1c8dcd678959d29c13d5cee7963f4bdd4dd0958a9cf073654702
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4942b68d1960c44c4739c266082cc9f5950502d58b412dc6a7c8a7b0cbd0f9f6
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24b80b55b47a0f94f6911f3ce9b3d063d30465c15dc6e3821e5f1b4bc0245d53
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7594ed6c5858fdbae17c3e781b35101064650e4c97f5462ce7c0666f50d14656
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff2e0cab44aa33e118b58cd56d76da68f0a890ab00ca1e30d9d4676323e82661
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:894f496fc4b4ee5683a721b52d7650ba112c315cb1416cda46e615e1e33ffa34
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e34e684f1309efeab3b8fe831c4f9f666838155ff5e03b262cd3691eb1a18183
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3d2348fd8dc6df48383b4769704ffcb99a491f2146301e6fd6a3fdd97ac2243
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3770e04aa486686bf905a35c0496153b72733835ce1f0eb1328cfeb8a39550a2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6529ef5b3fe348fb44dcec2ca6f8522fc3dadcc6ef26456b19b4352866456ef2
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64971c60db904cb783dbb689cc842fc4e61cd4f17715397a1a7546c46e0d21fa
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3eff245c2e0d9dbedecff6223acd46e9d772b43d2554aa853bc4dfcd94fdbd0
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b88cbbd3653e14c7894607f4b3a6f393426b16cfefe3458dfd0b0a2c9d0e70ab
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c6ed770741b62cbab8cfb5692c840d51cc6cc800d4807458551cd1eaf6c8323
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b01acd04eda65c9306abd957c08b06c1a8176b8f9cd094686105e6e5c5f4f8d
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d613a080ccb37fb09ed83637ade07f2c7eb6dea94c374aaa2465180156efca6
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82f6a86590531891dd5c5d18b774caa51bd14e4ab5d332dbf32bb5c0a677d4fc
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a172bebb560e39330ed1329b38b6806690a8e7455f9c5c921cbaffa99d38123c
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f41a95d6fde01cdd6d6a3dd636f66baf9e4d4ef382b86b9bc38e8d141a96fe40
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da03da1f85837c3e2cac06fd1ba505600483ba1b81d3736d87b950ad8c94f4ed
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47554b93cbbfc87c93aa9d75af7d952cf546b6149552e971390ea5347fa0d556
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2349fc6f1c5c1cb8d138ebb98f4171b5d044b13e3264308c48951d209a89336
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95ea3cd4c3da960b83f1a6618a3a143118bd824f21f3fb05161d271f086d481d
|
3 |
+
size 11395
|