Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/5/rnd_search_t_no_sched/comb_5/init/lm_head/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/lm_head/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/5/rnd_search_t_no_sched/comb_5/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49587ff544689519441b1432152f2196030d480e55f2560b4553a65564f0b7d1
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04f2010e0c324c3b9557ed987d2570ca8b951f440959b3f852513fad2373e62e
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4b7bafe680c7d1c2bb2c35bf193924e8e88cde3d903464b1cde1e21ae1f31b2
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62bdc3f418bffd4bae2af2754fa349ea2c14aa8de2d65c2282558830fddd3e23
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:127b44ab64140eeecf9e2ae93422e3234c95bdc5a70ee6a2235f855f8fb73f62
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9cc3cb76c9a3f8df62a59efe6464242fab58db91a0bf4e5a08b013796b4b3f7
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc61fbb56173aeee5abba7408010b20f5af21361f53264230592e899312393a0
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d64dfb7dfc2bc530e077f434e218bb072576b7fe773acf788189eb6573705dc0
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7994d5debf9021c01cce41b0426a249c656faa9fa1bd5a1a6dd41dd9ed0a690
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad1b9448ba5ac974585e662df213362f70eb76125e8784a1ad286d060210dc34
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8167bf8cd45ce448141387c65beb76a1da1708b4f192cad9045f32b593a1f39a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfd99d8f38219502d77c746b2828645841d6f8a9c68c8d5a817234982a6a6d1a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63ad275eb86067c886288ca2ac155e1bed7d7c278f6b4aaa697ee9d1572589a0
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df6f348616ddaea10df02c4ce06c2005da4c92fea737fe828ada7c0b82fdffdb
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae2630cd239e0013cc812704d9bf8bc5fb2062718f39e60ad5773f7d605839ec
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15264a75ac5dbc1c319d7a11edafb0d535372b78a85bb17ec9362a3604ce583c
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fcc9455dd35edb329643e1c2763b8ed640e665ccf415cb9c8b06dc968f496a0e
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a38a4e599445c7dfe00c6687ac7f3366f1e16e2f801c8055278d2686a3ca48c1
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2db0213c31a7c9cc93d15d51cf2bf1f3b452a0277a7432079038fd7c6c11b3af
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76e1e620cee779d612bb0c92900da40b2a4892297bc4d4ef0cfdc9cdfd4c5df9
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bf3c554c964eff50ff9a48a000269c14125a14a239b035d22b40241dcb7f27a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81251d9a4a516a3c4b86814a354ad0fc7e2f9542fe9056812b16a592bd1cacf9
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8655a6ff3dc50de40ec60d5ba73b5bec475ce68c7ad78ae587810fcf53aabcd
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cc7a9d696ae47e57a0e4f031fd971546e432b079b5a350855b0c549aa5ab011
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5dbaf6e3b52497e07114e3742a0016e49d9dff71fba4a2e5931e32e6369c56a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07bbb755fe4b6eb4b597934f140fd9a9bfadfca859eb055da22cfb1c5d89fc6d
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c44fba23b4ebcda0906989afd223ba825407de45abeac514cb3c6a3cf7712fe
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77cce3300c3b67c7d2e8b21eb95aa8f4deb0e3fdbfded392ffabff700341a796
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fba8c645f21bb066d58be4dcd15b7b97c1bc8bec9b34b639ff4fd068edc24f88
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7fed8733a3c90c08c6fa080e5a043bc508930dfc2accbed1c53ef877464ea12
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc6143040a641871ba459f35402eab3eaf2fee1d67c866ba2d41923d1a219b6f
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7e617ce797444efebbb592d141d6f3d9b6885be4e26b2997567acea37f329d4
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97719aba4cddc5678328180926c2e3a7e46db939b091c816e062612d3fc7a00f
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a139fad3c60ea640bd704af7b7e120359cedcf1854fa37679153d56457fb07f
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d482385c418d0d7bb027627381f6dcfccf14c4faa02e419f176c6886323c08f3
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e10550295afecd60fff9fd19a6d646728f4962aa9de115556841128920355c5
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ab1cebbb84b1991c25508197b7f5882483cec614e787ff597853886b98538a5
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c25dd3438c7b861f89f14507feb073300455234996e5a445f071b5209e4197a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a7e723e34eca9c6372c2fda1a505a3347f6cffcd15aaeb842c8a50e948d56be
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51ff740af29773af268612541ae02c32de5d654584b35b1bba32f0a0fc7689ee
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6023a1737e3322d37967da7077a5c23cde6218d09be7dc45eb8c8e7e814ddae
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ada2b24bc38ec4f4178b44879f2a676d144d2b3ca10eb88436ebf9d433a5e21
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7e6f567a4fa1df10f3628f7ebd0892f532bc8e45b56457a7a08b4dd29b209fe
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd2104e86b0b0c5a141969b92e58eb56be556cd006b9c85d32905dab19b0b249
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b9955c8bc4ba37ae4c98be06f28aa4701830330b92f27bf4c20b8c7a04fa70e
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa07572fb9ff76d8a36deda7e09a3f50a51bb3a1237c486b55e65ab66b3833cd
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6048c4db803698a0212bf77b1ada0566a9e4848dcd6441881fed7d2c1303a55
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d61c14553d168df887ac2d189b04515566739c87dda4f89669c52014fc9a743e
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2d964e6266adaf9807cd92fdc5a7fe3f9d4c45ca532f5fb11ed5a950d9c88ff
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_5/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7290e84377a2a0a0cc3dd295ece54c83bc038c7e21e5be16ac39ca99fe02804a
|
3 |
+
size 11395
|