Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/5/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt +3 -0
- params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt +3 -0
params/phi/5/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5f7dda4da518c9b487610dc567c15c099d13a1da79dc86ce4839e1fcfeea48e
|
3 |
+
size 205955
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d48a21677241a115836fe8b13b047a4d916af01f30ee643b5fdd7fab0492f833
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c6b52e1973610d4ed0900b53b13c2a9984cbc0ee1c312ef6313809cb2e145bb
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fcc530ae43d606c52f3ba6e3cd69a17e3388e3a555000c6af58bcf0e83dbf28
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dcc72b12290201fea6a5dc938e0313d104fa3a6f1148cfe8a58825aed94b6a9
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:577b6a436bde80ea5cebba66284e6c12f6c027d3b507bdcc5f6b28b56ebd7932
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b4d912ff4ddf78085485bfd097eb8dbd94224be5578e1d8f231068c7204e125
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5507da3c50449f154542caa987c5c5fb1c31c5a6591b16c025224e5141935e3a
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f74f52e96d7fd77d1c938bc1267740c28bd53eee50251809539ad00b2f91f5cb
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c058238bc62e924259797ed1a5d7fec26fc16c0ada4638e7d3cb1f7d29bf7f0b
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f5e2665989350573a4027940e96d143e44c983123a3ddef5ab8f7a7304461f4
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92b7c6893a2fdca4de20282d28517fb77a66fd4d5d1d862a09ca4185a60a33a7
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5259e46aaa3b420374efcbbcb9084831bc1d299b9bbd778fb1018760f3724ee6
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18f87e234c34c7188e5e81ca5e985ba39b50361ce080dbd415e2d078ec987468
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:197ee31d2f05c168b1f5f7f2d271d0e7c0d7797254b9a5d517efeb549d355345
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0684752c787af6fd382f081f65e3e46e34cb0fbd3d049d348f7ddaac7627848b
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b4a9dbfbef345d6e6e0619a7d1c3491ce6bf28c83e0ca256e54891a868980c0
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:619169b3aa4b8fd9b4beffb2a6836eb0cf644b4d283289bc560c5d3d257d4453
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1deb938a56f8158878edcb45d62d3502fb9928c64888d3fa0bfb6a6424a414e
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c91722d88ba86b3c167ba3a3fd939f2fd3f9df109ee532635b8fe77c04701b82
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a3b0042336e348861841a38a72070acf071d3cea2577de0f7fff4c52652c457
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:781e4cc7499b11c225e4ffa192e70eee25a29fc3abfa064dfd62779726584024
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68d99e21050cf50201fcf62040c973ba3dcd848659465c9c1d6164cd8b8f86c5
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e37ed8bd8d006f3216a2bdbc9eece28942cb9c6ecbba32abbb2d62e551fbbc2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0362cae6ca6c29eaaa5a1900827ef7206ed70edf8d9d9a300db6dccd44c138e8
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d83354214a494734bd3e6f039e322b5241492deddc3ab1309cd894807749667
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c24c722867630a213b2b32c4aba96c2aae01da0e3a9f9c11eb9c255e3ac66fd9
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6305cf89052bff2485fdd8ddff70ccad39202648314fe3898424de62d2de9c19
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd5d8d833f74ebc3d07acfc504d07bb2cb0fbac0fab30cc9e5168c192bb6c093
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf21b36d485857ec70001f19aba0278ac81b52c0b56364e324eae073e02b347a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a288665bf61e2ac6e7d18d949a9064c3e14e1721d710e82bcf675891ab17926c
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ce2d69712c44f2552f7c028c480bf323972db784093d95befbb12f253854e74
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47f3d1b67a526e4f7c4e2f6952cfd61c70b0dc6f801aac0733c4fb78791fd8ac
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09db1408bbaee1938bede1fe7308ffbbc1d53824ea32b3e68cc9cc5ae24cf3b2
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35d85ae18cbfd7d7aedfd641ffc8666d703b4d482e595955f980f89363f51f28
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a01d0ef3dc0b8f0942244ebed0a9e8b0ee2978a2c3ab3783ddcfd3c708bcee59
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a332306311c03470ca7e060c7a389fc6080fca6cc714d131cf17a818fb36e33a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3ba3ee988b022c336e8e425bbf0944432fcf70113ed889a61b56102a1aad834
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00b6d11e361b815408da7cc45bdd3a6f51732d0dc2aea90bbb29028d77548a66
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97a970d54f87eedfaf76660ee627ea34138bd0b7504aeb3e4af48289e4da7f01
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11acb470c4127b322fa8880f416f5448b41a1cf14d98293a5cb4fb76a6b8172e
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:161c8371810822a4d6d403f38e1e75a30e682b708f6602824b5fc0d480c6bf32
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:646220168f5c140433de689b5a5e52b3d5971ba245b594bf86f7caaf80f0b045
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9faacd054e5be373f9d41e9ea7ad3f6298a288456d9de1fa122eb311d8050fb2
|
3 |
+
size 42115
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:927911fdb8912785f165ef4a3abd7d72a55d3cc2ff0f3f4a65bd573b0c549019
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92d39d3762b49f3c6e00b294fd7401e268db62657ae535c13bf7343c6d331ce3
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb555392dca44193cdc6a22f91d8228f7bd6fcdc715b61ba294f307b499e8e5d
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd0c0154f8a524b1d2c46c3b4912b0558e2cb5c7c610b520f45419a893d9b98a
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:318be03855a526881539570f6e172cce61788a4ca03efdfab54197281e682060
|
3 |
+
size 11395
|
params/phi/5/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e38151899636a630a9bae9c98eaea4cdfa32fd1774529051579ac2f26f59f6a
|
3 |
+
size 42115
|