Diogo-V commited on
Commit
c8798b4
1 Parent(s): ba66d81

Adding more results

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt +3 -0
  2. params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt +3 -0
  3. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt +3 -0
  4. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt +3 -0
  5. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt +3 -0
  6. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt +3 -0
  7. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt +3 -0
  8. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt +3 -0
  9. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
  10. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
  11. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
  12. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
  13. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
  14. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
  15. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt +3 -0
  16. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt +3 -0
  17. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt +3 -0
  18. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt +3 -0
  19. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt +3 -0
  20. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt +3 -0
  21. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
  22. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
  23. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
  24. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
  25. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
  26. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
  27. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt +3 -0
  28. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt +3 -0
  29. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt +3 -0
  30. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt +3 -0
  31. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt +3 -0
  32. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt +3 -0
  33. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
  34. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
  35. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
  36. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
  37. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
  38. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
  39. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt +3 -0
  40. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt +3 -0
  41. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt +3 -0
  42. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt +3 -0
  43. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt +3 -0
  44. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt +3 -0
  45. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
  46. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
  47. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
  48. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
  49. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
  50. params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
3
+ size 205955
params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a63d286686cef7e1a88219cb19f9019238d6b80fe317010ecfaea17b653511be
3
+ size 205955
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:175063cffcd0fe3849bf8e0c30a95aefbf2004ec5e9d3b0b5ccab5a69c2123c4
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4abaf283c24b88d4a5bd1c856d0dcf1ae90a20d6a0389272196dd2fa9fc077e1
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8dea1bfa2b97fa8454b5f5056ae4511d1aee5ecc573d4f1c32ddfe1ffdcf098
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09b1c4932597015532f16d30b59376904f67fdb2a733b585b72ff1d24c44ed3e
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4f41bacb44dd2cc12c63ec81b4c3fb202a17625aafaffbadfe16d4bba759a0f
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27c189dc3a70501cfe33d08adb18ae3c940bbf4365ba9036eb0a7961e789bb11
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d06db3becaee64ce237d335d8275ba5bd5943af7c6d2bdb066b137ba2734d72
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d0ff9406289fbc46fb0d1fafb11c9f59a70e59ce1c406ba7e4c2edb1b31e803
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4c34def52b9d74a55b6a7ee209a923ccfa2b9acd4f64ffc82e8e1ef3f1e0110
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:828c11aeaa87617168d7f5d27b7fadf38061447215f3f20e6475aaddd2c7a01b
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6b3a1c017641958de8c7ba27de0163f4f7ded0d42881a58aaf8bbc6d615368c
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8128a89902ce98fbd0912798b7c39da2c55282948f1a8d7644947d23be1c00d
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beb6bbed83b4eb7bd4e733fbcb241a41ff61483d91d2588bdb70a1e56428786c
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5abc67005a5a1b831938e9bb7eeb47523f5570d1a95d892b6da2f6c656f2b306
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db852d18abc43d31e59d9b81491e1b861cbba5c2561e1bd12d7e423e1e38e596
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df178fdf5e1f819ecb94eb4d7c42962793ef060a2da68c8b365dbc17f114ada2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1220e2ce344ec474651ebd6ea3d3f89a7ae957d25a00b3b71593f1cb9d366ce9
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:498290234d06cec336ee9d1d3bfc0b7c2cd1d60b8d4b6f4a234de76a7af32dfa
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52d52aa054ed98c970c82944694cc6381d9e19e8f92b39a9c1f91ce1b8565241
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2268137a0c09e1a6edde009b8ab13376b9a85afd9d47cf55469e4eaa530b8a00
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba26e06fe7b3941a2708ec1ac604877026c88e2bf581fada3c5978c22560f98e
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f01d070e594a6faa8b85195e9e7c97479a0249a27ec3fe747a682541eda3ebb
3
+ size 42115
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38f96e425a7a89cb49faae2d1670643efedf4eaf371e3bb7214d58683cbdaced
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6dd986efc7ad61d1c9e8df7bff4b95507bdd205f826afdd69495932a82e5321
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5f452b5524db2b5bb608d4ad566076ce75925a8132372224b9fe4fd6e8f041d
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8822852342fb2a912ff50da0476020157b6ac8e8ccb15bb7ce88672f01704619
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89e0b4a39c31538b92729ed27ddcfcff4647c5b32ccddf9d8a971a4d46a964a2
3
+ size 11395