Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/8/rnd_search_t_no_sched/comb_4/init/lm_head/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.mlp.fc1/_s.pt +3 -0
params/phi/8/rnd_search_t_no_sched/comb_4/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e8dc20a0c10ad07e42db91067a99c16a163aaf089f94e9c0f3858d7bb035130
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10a584fa5a48e02489e5e392d1813d8adf36f28e148cdf5afbdcc39abfaaa52a
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f0ef7a109ca580f16b100943dac8839028cf8333b5f56ee1fecb92160e6d1b1
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d23f2cfd40426b68bbee5058cd9a9a83c889d70f5990533c16d54e628364148
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddf48cc51e90faec52b1cc4c229924a3f29727e907e90f30512e6da330c5646a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b72c8370032207aac40d62c0a508a80cfbb0ddd1edcc9c246f4adeccbeb5341
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08213392751565fbf83d8e63577e72625e435ceb37958557e5ca0ffc393d05c6
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8415cac0de7eda0f34ac041244f8fbc3f4adb56565c8b3274ac06c9f9861883e
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cbc87600397814f19e97cb67db26d9f644324b28f66bcfa5bf3ac4567e99c6b
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f482d6ed076e7357ae7d2e80ead31aa7b1c78bd371611399df54e917e67b79e3
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc97630a5e70c342d2de9efaa8bf18da092bdab6414e953f7788d8b93041e4ff
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:771b673e1b4a4baad06e2e4de35ec6c721a966d4f7c502a62cc59297fa36bc64
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eefaac7605292b87b812995f6eafe159618beb214975e512589ec7464e1f886
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:551039478dd6a2b25207b9a815573473cdeca7acbc317a384f3a95f4ecce7b09
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:981eb60313db1da6d470f05fc4eb24e394cc192c022a7c9166ee951e50b99f3f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36393d4de4e3205129e80779c4c9ae869dffdc68585fda511b4d998b857ac10b
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea98bef389e97ebde1eb48d1609c6eaa1fa5c27a0cfd58de5799616761f110bb
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7b990d0db465c7943664072cb788d92cf2125a4d17ede0bdbae41a9a30c7abf
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2141b1e86d1fc3c08942aab863f454a39173540db97967e65b9a4572776112e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d8712cab96958b30688636ebba631acca7c5922562f5b7950794eceff3b302f
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:823193c0a169a1a525310f59e80acf2ba2b33c99dc9cef48b935ea13834b6379
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51264df1814a624e3652243a69123019badf52470276e93043428df6702ba032
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53448df6d444ee1031062a94d656bfb1714c0a9a168077b302d0ea83a05e1bfc
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27fd194e0e8da836016c472c5fb1b9c022df51c53ae5fcfc3e0ae203d3e6fa92
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f97ea3a80ee11c6747d735272bd1f1c0c5550b370dfb947291db02ebe70b84eb
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8123bb0f49cd40f03cdcf3c97253bc85dfbd1d7283a1565dc84721153ed33947
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b14c0bc721a7a7688fb9615a6f20ac713f65bf879557773591624a9d07861ba7
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f9e94c1677b38387886aa90cea71cc5f93525939f0a246c2f97a322bc8961d9
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ede73915bca083499c6040c7fab360694950da7b3005bad86252b4f9429f669d
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ebe7029e6de3d5cd6980102364376ed52f8fdd9e4c5c896c9f4b66c4e203606
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.12.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91aa8990e50ed961fea5c015980a1999e2fadf414b4b6cf55407f31181b16b47
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ea9907a0ff645d177d8a0b183f783e95fc3c98211501ae67adff3fc1f631a05
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40a6227c7d4ec0d4d1e4d724b77ec9b0ad7dedf52ed8a434d45d5c1d09174fd6
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30b657fe835adb8260d4911317be2167e7f969a9026abe152935bef311f9d1f0
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6024328fbb3b500e56c3c5c34e484461e79bd86e2af140c7ea59a7cfec84b2e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b83ba27950ed6ed7d48f23227acab26d1a49f170d7119d7bad8c273a04187d5
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.13.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22340c4a6507eb578b77c7cddd060107e1cb0e3b573623801b3b3f54410967ad
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:487e9c3d24e13a968d899ccf09dbbc0753e5b0766d39865eb96ed91880585c99
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74f0aa738d68932910f59c09793f0547a8a7ac54107a2dda621c7867504b80f5
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cff9e0249f1b1ff1c4b2321575f3b4a390681fae7a0e07ff6d71c57821ad121e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02120ef320730b6f576f59d40ab2c38ad1ae2b24bf9814ddb4f721082676f24f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:500d78483b0d1febefa2f07438ce0a1292cc6d3155a34c1f55260271c833616a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.14.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eeee5b4fa45426c5bc0c09ccaf4e0f6f47bef936a9d19abe5e75f2ba4401f826
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d44487f75c105cd109de193cd509518895bea01445b2da530da531de3153d2ac
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:959bd5cf0da4cf10466646171e5b7085095fe341df4e4366de765c79bbb7ccc2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5293e49b80e89d9e2a8ab61a684f042c9b2270c0a608869e20d6a31a8b6a5476
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57a486b50157b55fc07d4817d8012fad4a30517bfd959c4de99b9bc54f610954
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:267d1607531f28f4d3518b810e0c43cb699cbb315e961e8a1df162c8c87a714c
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.15.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31a91ce67e1ea8ae82b047999317ce6a3d2cbe08e89e9decc94ff78f5bf9c9c4
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_4/init/model.layers.16.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:737936eb6662fa4ad7c4d314ab25d321fdbbf868a1e32435bbe340690b766348
|
3 |
+
size 42115
|