Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/4/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/4/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6915dbef73259411dd529b917a1b487cd895b7f73f7a47787b6957730ae9b5d4
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a8cc0cc8fccf5d9a49a612394d57cd0c1fe4a8809046b6f2e572c7bc5136eba
|
3 |
+
size 205955
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cadca7a9383843c75e3560e20cde7b8d5b37d5e87d7640429086dc7fa3610d8b
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2479639932ee3f58661c26aad37dc49d082241e743e56f58960c7dcf9bec4b6
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc61ae19f09adedea582eabc1b9bb1ede11a712c1206e1cf990aa67a7bc23f64
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd00b5ccd0f78d75ba763a91d9b221a753cff4d5b6810267264bfd702799e847
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ed029b864b4bd6c1b11a00c9ce670a58f5398d7db94ec45fdb880a04f3e4f11
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b3183fce6e59ea207babcc7dea23d9604612263c549866ab540e4d1f35d769f
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1ef8b1a01290b070babae11757b77b2ff0b01acae50233ba34bcb9deb01a1b1
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8f0676ad2c3804c05f6dcb3c190d251a22ccd728b0e5e2df7c3d00638bad1ae
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2479639932ee3f58661c26aad37dc49d082241e743e56f58960c7dcf9bec4b6
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f55cd8a09b75d30e8a8928cf5575a081c78cf1478f07f74db6fc1a7014762df2
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:991634a419cae986dd3ce0ef2dab34583d7fabe33c90f2a338fd2dd9f2476dfe
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc0242a52a8dbc9023736e2f43e8c9bdd50306f18369a7c05d9b17a946337242
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee6b734f034aaa55a4b6be903c7bb15fbd3e85fa9ba25b398871c15637a1f15d
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92315856bbe1c209a5adf6122c5d34b2c21dc695021ad1041e2c1e01c1487b23
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac573bed4927049d74fb0a4c8c969d5728bfb39ec51f78bb07f48f51d1b1346a
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2479639932ee3f58661c26aad37dc49d082241e743e56f58960c7dcf9bec4b6
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c83d6571f7b6df6ee8095423fc004daa4cf4f6c173b47acc62bb27463519a67b
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37d6abf405bb02cabf850e856880bf74462fdbfc08a4656b396ce5cbc12c8c7f
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3132cecf9198fe1e9046b9365982b1d24a34048b8a972ab7f5eadb40bec4c61
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:186bc2515251d63f9befca390af4fcaf47f015429e72283b1d23337380f5909e
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:052125549a0a128c4e4d59dc14d0d5bcbb60daf247095f4a87ad34b94bece287
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93218b70a66fd78231e8abb47e180fae01503e71a7d28a0e5f31bf1e304bf6f0
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2479639932ee3f58661c26aad37dc49d082241e743e56f58960c7dcf9bec4b6
|
3 |
+
size 42115
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cc8fcb58cc44d61dee4e4ddcf47f25ab8a785ac37ff61036e73a5e8fdbe7c29
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4f4ab6673132e47ee91f00d1c9dc239d00ad65bbfd0285deee4aaf962a91bf0
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7525da2ca516b80056314d7a0c7dac0ebfeed626289575b2e876ff91c90b31cd
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5d1ca67727f0b8bb383d00fa7da8de2058a21e36556a16cb45f20e75f8faab0
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d5f10993706e3db82d3428b8b7edc3e287ec42425712b995ca77b24f4914576
|
3 |
+
size 11395
|
params/phi/4/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1c0b6f97756d6087e19f8f3f8bc05a74b365ca93c443783fbd71cf5dabcf789
|
3 |
+
size 11395
|