Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/8/rnd_search_t_no_sched/comb_9/init/lm_head/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/lm_head/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/8/rnd_search_t_no_sched/comb_9/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5d61f55b645d37e73c2cb89d7d3d528f312c1f63300252529cba126b3783b7f
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4482818bfe48d31b525765139147606ebcc5ee7379efe40eb9e97eee96bf9d2
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5f14c3a59536b1d523b319bd5a309edd9a7b9a0f8268e879e415e2f39a9ee47
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c42225f3d1fcdb24ba882666dbbb128d551b284892566cdc156d3785ab825fa8
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64d718026220f9e271ac352d5ddaa4bb6d6cb5a2268f87b8e8fe81435e405583
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2597343d55ae7bd5f6c8d8b3a5730bf979a0f25a2432d4986d7d50dd11943035
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77b0d9b00a5fd01f9a8d77b996335142ad4b11afac9e8cfd1c5d52122dbec4ad
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d6c559fc06a909bc13f215b60676b09c4a55a301d1c8746d21767a17a4e9ada
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aabc56625b2d90c17b9348677ae1798e4c134e2b800ac2178f25acfd864cc648
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c3c74d27aa7a1e56553538fcf10f14df0ee83fe109782c43fb529f0b93d9ef5
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4af58a81abd28e394daed5e1a6e4e3b5887461e36b88cb6056a767ec02f92618
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73507237dd1e6bc17d4d64a7451aee85fdb72a167d4408674daede6fbbecee51
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:557c776ca02287c97f1295e1a5a5b08da3a70512761cf44c26c51e4c74e747fd
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a6e8e9d4468b94fa6dfbb934eb77bc88b5153a9b8eb70fd50ad46aaa08b6404
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:852d3b5d548d1fd15f7923d3dfe6f3c7836a6179c1935b377854daebf686ad2e
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d745004a167b204aa9ef48a93c07c3168d9184009e0012e71633273cd0feb85
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b19a3faecb7428aa4c7e4e83d62fba8d0821de8449d9ddc9ef43270717414a9
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a64a277bfc825cffcfc61e2524b00ce83733503691f06f8adf3fb61fd41eeb2a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:593a6da477bda4e6ce8a40af14cc0b6d3aa1ad16a9d730317dfe9810219fad04
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0d0be0cba696b3a7f66c81d832c029db0ff5aa08d0ca288e596b465f9537a4f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ec38b6f62aed3f948f6d1cfb355653716f287bc5145db39bc650a6caf4938af
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:138ef98abd0c0bec35a4e8cc5635ab56cbb6bd637678ce20fe32f37e105392b8
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83101740e39bb8b22c5a25776e1d43685a8396f314c815cd950d1af13220150b
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bfd3ef7b5916d2ad55930f598a5c58d1cd224f21c5475b3563d8df676803b2f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdeda9e8fba26fc5357228c17305bce0862ca12f138d960cbcc4fc64641d392a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1de5cab86394dfaa46524b87a6ed709570291aa163e73bde36cc7535ec7163ff
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:312ce302913eaedb099d04ef7079026fdacc4494304b9d69023eb1ad910329fe
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e793ec168e2a64e4465df82424c4baf9131d0e589cfaba6d559fe84aa17c82c9
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b845ce7e9fe6ba323baebdd3cedf29b03f846b5945663c19ad304f35180e092
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa859d6c3cdd763de73ece0e2d7b98dfef6a764f5052fde61138d4a34044fc05
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:366c2290203e7fd154124da28b7d0cc62c50d28c14d27872d1625a3adff30abf
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e68d8c6a75a53c16bb354046b315ede4912c146a8dd0da02a594508f6ed88c4
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93c7f94b377756f369e76658f7ecbdf3fdc781650821aedb3f7ffc3ae2b3d476
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b67ff61565b74beaa00ba11930697eae6d5d08d1948f44f8ab3c7a877433ff7
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8f1dff0fe1314db8801d640d40f076777cb8471c5d83985fd75e2043bed7420
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdcd10ad82cf2323e0130bbc6da2767bd186d2e3efccc4c533e26b9c434b4daa
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d01410214ad7ed42b089bd807fe8a4044bc87ab2c1c391a067615253b79268c
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f5ea71583afd2b7e2b74908b32642d8b511d7efc0899124ad6c44b6cda6f272
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eef5f450bbf405a9fffaf2aa994401a7d211042e04c99c4acb0342c34397c821
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a63d21cc6539bd813b82b5266c23d710f81631adfc55d66c3166537a2b8a592
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f97acece1110c42d3817047fc5178cd73166edf121740ae0f006b610f8abdc4
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d1ffed23feb6b0d7ce734420e28e1d9693261ce4b38ca92dec356453184fe4a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ac969357c8561ab6ad5c0550468a4794ab6d51e10c8c3460ad60e24f77ce07d
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a60f9986760bad29b0dc94457304a90d066db2a6e32d46fc6eb78873bc483f9
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b8f2b0af41b91e7a13a6858b916ab673a1d147cc2c52f9aee2349a9053314c6
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd393a78002579bb238e4573d81bf5797baa8596dd2ae8a76010de74cc66b679
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd6c0d79397ae0d20eaf6dfe5a70cdedbf47e40caa7f1f906cbf665b0f1844b7
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2283cb06f112fe2fbcee18edb8e06e73231dc3ecd42f509399c701b4ba1f448f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de001b4a2913e1fc955fd3aaf4ef989826999c3c5657cca60baf3e4e7b581692
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_9/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1a6ef9eb85e9fa4c13980d01b9f34b142494f25554d0870a4cde3d853dd7ee4
|
3 |
+
size 11395
|