Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/8/rnd_search_t_no_sched/comb_15/init/lm_head/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/lm_head/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/8/rnd_search_t_no_sched/comb_15/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5c5ddb4ce569e2386bc734b66208dfefa3a05adfd8381899bdc065e9e3eda94
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:215778505ed325643e60dc1e131eda38c5d7c8735c7ad8ecafea17b6ce214111
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0aaded01a5429e63649b26b3345c7a92be50200bdb3360c8fe84c9e7418c866c
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06d24a6cda5b5055732900bbfbd32d6fb67b6dd610976a6ce2cccaca922fc9c0
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d22fd388fdc29ba5d7c6bd8925a165fa4680dc2634c2eb8c569ebfc3ed3f70a6
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e4b6f99a181b562f97d46cd0fb8141f6bd103f635209d6fbc290e0ea26c1ae0
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66ed43c565dc73e036c1e0d71b283e55bc4f28253603f6b19b90f6d26eaa93b2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72a9a10fb43c9beb5475a7a4b9796bb9d0ed787f22279909f896c64bdfda82af
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6aac7803fbd58680c132d111b62642b961361956dec22de80bcdb66d8b580142
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7309636e77e2159c9f78082410413db689a4287a06147067d7c8ccfccc615b1c
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af5e87485dd1e84e69d28e5f06beee2abbe34dc72f641b610b254624856058fe
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:423ccb529b017a897b1dd77b9577390446122bc173963565c50bf7a84579d4b2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef352ef3dc04af4532570195fdb32d1b9c9d22c9fd45a35ef16b075765c6b1c5
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11a249705b353d3ff61322f5c73f45c5d1b6bf8669806035430260c2436732b4
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89aed12ecf1297be0440fe757ec65c3caf8efd504b638a7d9881c30837396ae6
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc2dd1ca72d468a09abe4373224c92a92c537181a3b7db741adfc0107ebaf494
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:741f62050d7b981575232545dc3a37914e22c87e61ee302269e5ecfbe792d58c
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:585aa3dce6206056caff4a29121250111ff137d0383fed0d389db6b595028552
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:977f686229ad42e64aa76dada78ce2930a33ce9cb5e8b79892b0a7915daee779
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b04dc5bce2533665eaa6d23a0e5fb40f8212a37be2a362d033a7e2f9a6861f19
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35196c94476d75a92a82f5941e265e7e3b5bf0d688acb19d2cd27ce4b9e1ef15
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:351ed68a600d5b347357d452b86cbf301726ff9ead0d21e11ad49cd2ba084506
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73a669db38cdeb0537ae2690bd49964dc9abc909e40af0494452c4b17ea53dcd
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cd86184b640893bde9601c71eb9eb1b6f8346de6bfa9683c352648df3032758
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0d3090e0d2ad049523b37ad3864260982bf2dd923bcb9c67d60ae2be914feb6
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dda630c8cdb2b9f621322bf2b0144974b9e1bfc8ac5daf3d9961a870aa83ceb5
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35e253c43a4c720421345a62a9ee464316d7b313deffc7e700dbf16e0cf3a9e1
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4e0066c31be32fc96f83e9b7596b213c56c657e1a64010414c52f6c783fbc4a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14e9afbfef35751dbb36b5605228942b1843ecf5776fe0df4cc0e8ee11e4242a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf13f0db81fd10d231213d8e53858337c4997da27e24a5fa46fbf05650e3838b
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72d74f592dbaf2a78b7134b196f03516c7aad8bae49e1680763c4dab45fdfc55
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06e826621a1034aca4ee6c5b440fb5ce9d2ca422e08815f4d91f89aa80af1638
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05f3c7e72a4f130851dd32347036d4b53be235c5df6dfb4fb50bde8b846657aa
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04b40897dff4dd52615b8ad920cbb140263b690ad287a83b5b6ea8a8cb5dd72e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf4076ccb551740680adcaca9bd6e42d38cf0cedbd416bde7a3e83818e41f545
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e776009dd002aa79ff4244f93bd3d8617da3f6180c0083daf9452b2c24b85c3
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d7e4394d3522539e2426b932367e304ebe46992b42c9373b35512d2fdc75362
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbf9e37785f8f1b05948320d4df379eebb8164ec8fc6f6cac46479d1c3aa91ce
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a8bb7ed65e6d9560d4ffe276686e80f328e4a53f2586ad3034c7a021b51af8a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58a36afdd5923c893bba9d57b788b71b846a5abe130b891c14d59ae452658d8f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2f9bf4996f86066399fda95b32f0ad3a2e7bfc8d685ac9a15cb0ac98e12dc48
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_15/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ba9173ae067a6e5e91fc92c14702a8183d788cf61e53aabeba5cd445de90d25
|
3 |
+
size 11395
|