Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/5/rnd_search_t_no_sched/comb_7/init/lm_head/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/lm_head/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/5/rnd_search_t_no_sched/comb_7/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f27ad4415b66de9986ce7063d9feaab11174fd4d63dc869e57b52b8a1c4c91a9
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38261ff59332c8d2783b1c1d4e012b4a183dcbd70e0d1e3faf3b8615daa2d87f
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e30596b9b651a2b73557b4b4502622783546af7e265cc36dca7e77eb964b39f0
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef1837e86e054dd898a6993f3e8c2045df8f3a157a041f0148540843288a679d
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7556ac38cfeeee9f139217d2bf9468707c94cdc1c05f4c3bcf9a6253c3e3c4d0
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:626c4ff0e1f10f269bb53262916dbc31b1a89b980baf41c02843439c0634a5b7
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a29255243cf6200e7e02fed3ab818e8af50c6154e3903a5da84e402699293f65
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c67b69bd198092fc013a81adc4613edf6283f2624785b5b622376e810b650a90
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c27f94322363a6f1cdf8a7c734d7c70fd7d3962f17fd1f4f34743251ae81dfde
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c79c55332ba32cdc9eeb4ac8a28ce58999ea012d91412998e0543991b3ee7d82
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04910f629f65bcc746146a59721550da6559756078c64c7f6f2d58cdc1e35051
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ce2af06ad80d23a48752055679eb337a34cd28a83b2c8001ca32845b1e598c4
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4813f42aced8513ddd26dba360847ce7b30e6207bdbc463875aa10ee845a6991
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48938085563297c4d91c931f19ea9790407eea1c3058010ad01ab263cc4144fd
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c5b34aa338357e1c67c2fc568d35772bb8765ad5b0c06f031cb8830b57341c1
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fcff40067ee13fa2a34f5407523a34aeda6d2fbcec37e5f8d1a92084366cca5
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1130418082c99455e72fabeb327516e736af76ce5065dac0dc7c4919fce7f148
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1309ee4d6d2225039697444794d1d579f3d9e2b93a8e4f681481b7d8be66267c
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78c7b2dc10bb9c1363ced128dbc55d3bfcabe52bbc100ffcbf3d7f7cbcc8bbc3
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:980b5c23e2c6a7f829a7a75554e8f2b221d6e1cea16bd866d0f43f9922370e38
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b49db455367122c1297a94ce683b3d6d8d0c158807ba3433fcfdc5d7f0e0ebec
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d40ff32e80fcaf1d67153c0edb9af5837317cc4ec1e3f3666296ad397af64c98
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaeaae77ebbe273a053f975823076b04f3c5c58aaa06a88dc95ff8df2f49a2ab
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62bf32c133bd9c5153ba8315d0cbcb2dd75c79d5384bd324d6bf4dad73ff574f
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_7/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c1ac2fbb8fb0f7048bf5b64ad30b6377d8b8623980303dce425b313f0da7342
|
3 |
+
size 11395
|