Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/8/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/8/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:904758a154c98c640001f446d4c1090c3d467c6c0f2cf531137e85c98eb016d1
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a58194e28d6554db10edb6ff5e0f5537f1c4eb7fa9c9faada7e302ab91ac9c40
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee1381305e81de94ab396b27da4295667a403d16d85883135bd34d021e0c83f9
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f416bc773be74ae9c440b8cb04f0aee2a6ad6670d946fe388c5322daa25c9f3d
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b5065cf306017afed3a60bea224899419fcb29eff9f5aa987ef204eb529589e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c11cc15267c7049fb4385ea0e0d29aa8b749131ec34dcbd17840617e04050bb
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e159ab50e181f0ac7af9682d8d39115a1f2171e783678dfa3bee2393528d447
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c1dc0fdeab6de176966bcc6cd137a91c38c2c072fbf6914c6b7a64c06a178d8
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f34bb0dec05bdb2524555ff2aa5eafbbeb4b76d53de90b5783eee0f50786909d
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f62bfec4833f3d5265fc174f6947c437d3e46950945734d4207c4b9910bbacba
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cf1f1f7b5db34613dd59344bc2f6a418c9f8ee72bddbfef9313765e0911536b
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:145017d0622c6a6009b2c49402a7cb7c62fb06e97cc08bf58a7fddf27bf39e6e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e50671479105857ac64e90eb67406882446b96c2eb1c850b443fad64d40c7906
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2c955259ac4ee2a3e63fe898ffb6619141a83193e3f15d748b1010c826ad50a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d880633cea9780c4e812fc141b856f7bda15f5688fc700fa57815fff38e8b92
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:703a50ab399b118977dcfd3973e9594df90e456ad7bbc520e7d3d56e76ccb570
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff472ebecd1d9252987005f3d7b5ff669f3b5696c8f8a06ef6159088f7174d4f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2484cf56a27ed18e3e48bffd3910abc611ad959684f61fd59df0b2efdf4c8b6
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d1e56262431eda3719185a252d8e868ca336a2b489301b18e44483ecc9aa467
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:056e2a5cccc57414f20a22b8f9329b21e23cdca9ff1edc4995ddb6f72733ceec
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d9d6d5297ce75214d6a2418a4f6ac449c842b64578c092665ac77b3510b184f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7ee999bfa9cebb18fb38d2564b3c41fd46644ab59361f6c0e007bef2baf8c2a
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:763b01065191c395a0c258be2c39e01ddc714e002fd915fffab7b52d5ac3cf65
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7deb221504fc1b98a2a401237d29500aff2c8eea1b2cd5827de57c9680a42014
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d2855c8e360729c825ed74dc9c8b09230f654d0b8e387e83a7b11879042a395
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0487574ae995bf7b46f9bd88d2041ae0f09e6f459652d2bec8dd747ad1f1e05
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34380eca8bb0bb97fe2c0b1b19343d6fe169138ed9933f9bae883a47e80292d4
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1496fe8fb9f1bee89f1a5605bd9798c09c3a685f00c6375bf8b844bc982c33b5
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c04a05d0e50d92bc324c02713eff1f9e73e9bb797ee57122a975e5092f303c35
|
3 |
+
size 11395
|