Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/6/rnd_search_t_no_sched/comb_7/init/lm_head/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/lm_head/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/6/rnd_search_t_no_sched/comb_7/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64de37c178e23eecca26349b827acb74fa196e3ca61c869f782d662a368e274e
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b193e6253378535c9748e5390860ca66caf28273d14e11f098e5906e35edd3eb
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92c0c5390c2d7018cb00e44a4fd18f65fd0d984750f7603017680c22626221b8
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89ff3f77de60b38ce58109f8ea4fb664222e76da8488a3288d2c1dc8f15becdf
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:478642760d9348ff718e0b3f51b946a8b1a1801c31d3cee71f5a37d3a287f45a
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:789ed424b7f0fb79b308a4d467113bc42be30eae5c6f06cfe68318866f3d7d6f
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b9a1543678a8280175ac79e9e53b82bb2520b2e4cc5811399d484045bf79c34
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73552436b7c9f3877b2163b508c726fc36adcfb213c858b6a231884ba6bbbd3d
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65e151e69a84c45c79bbefa1c8862ddacd1a7774e7bac7269b452cefb4767677
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61af82eb955110b70a6a6c6b2f515af78482ae2ce4bcd0c7f1d88e47ee87d5c4
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bf39695fe1c3aa0ab2a33067e399ec0117288d3c68501def1df3c1489ae16e3
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1733b8d6205aab51b53802e7d043fceae25f4adeafc8b7d471c63e921dff333a
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a6f7d0649b6c65bc4ed3d234ea814b7f065312ca6e2bd48296cfaf811dec9e2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:173a4db60218c0807bfc198b3d9447843911da13702aa6e34bb6a4577d9afdce
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35799468fd13f3333e505dca1502acfcbe589cbe3cf8850825a963240ce6a918
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7d2305a21a5710768c01246506a2d2964375038f5012ccb401b120a6d0166f0
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:243958c453dc5032b5cc0dbe272f77c121798e6f6103375972f80d8efcdd05f2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:400dfc744dae416fe003f48065e78b16ba80ad366251f27acc78ea26d1622ed5
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10e7ef94b1cda599961f9de57123a0f902c6eb2a86fc4ca7c0490f284fde8de7
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf82c3205aa1641ab03069bbbda0537121ea976623fe1f883a84fbfe931a364c
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f480d34bdb27839dcba151d2c1c326ade486536404d41b8583058a8c4812374
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83ef5e9f18c05f16b666d0562949d6f4c29ecb44a24ed67fdf209ffe6d454593
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ea336ee5f8007acb9351b82cbd2e13b0ce19183ebfacaf2cd07e5ad51a08372
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec4a679e0e19f47c4aed5f2ec42bd648b060caa82c0ee17cc0e364c9c2666c4c
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbb0b624c336a33860f48309a60768119d8cabfc0d80a803436c454f806b0079
|
3 |
+
size 11395
|