Diogo-V commited on
Commit
d8943ad
1 Parent(s): ed4941a

Adding more results

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/phi/7/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt +3 -0
  2. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt +3 -0
  3. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt +3 -0
  4. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt +3 -0
  5. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
  6. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
  7. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
  8. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt +3 -0
  9. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt +3 -0
  10. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt +3 -0
  11. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
  12. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
  13. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
  14. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt +3 -0
  15. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt +3 -0
  16. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt +3 -0
  17. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
  18. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
  19. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
  20. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt +3 -0
  21. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt +3 -0
  22. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt +3 -0
  23. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
  24. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
  25. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
  26. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt +3 -0
  27. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt +3 -0
  28. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt +3 -0
  29. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt +3 -0
  30. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt +3 -0
  31. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt +3 -0
  32. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt +3 -0
  33. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt +3 -0
  34. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt +3 -0
  35. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt +3 -0
  36. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt +3 -0
  37. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt +3 -0
  38. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt +3 -0
  39. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt +3 -0
  40. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt +3 -0
  41. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt +3 -0
  42. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt +3 -0
  43. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt +3 -0
  44. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt +3 -0
  45. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt +3 -0
  46. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt +3 -0
  47. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt +3 -0
  48. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt +3 -0
  49. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt +3 -0
  50. params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt +3 -0
params/phi/7/rnd_search_t_no_sched/comb_18/init/lm_head/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:397d112ec929a21a9b6d562bd24ad20b621ea702f4ba6b78a1806e77a1f94ce9
3
+ size 205955
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e51065266e2d414d8f6705493a86528e55c0f790e4499d0b243045e9bc7c9e0
3
+ size 42115
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b06fc8d2a1a3fbbb6ea98a916e454fe56c5fbbbab3da57d885a674d88915b10e
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8200bf518dfb61cfb8e196bee65b18f8bc5c870dcb7d0f0650453743c75a4f06
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:483abf1d45b88d7f2983d981c967fd305db260c3b2045777139af1f7e23535d4
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a03305ff556bafcd48ba3fcc3adb368089b71bc3ae19e900d5f649e85e7b60dc
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.0.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5894322535ef3dc0b8c50fdba6eb17612bfadfa0d99f8dfaa7349d98c1bfd00
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9232b03a3096e4288224bdeb3f797cd38db170c3876b08a057ea689446a54e41
3
+ size 42115
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0530db145374d8601fe5aa42e18d54a8ca7a16b291bb05e58b28af2d1c4b2067
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b6f3a29e4dd84f877c9cd6a767b14c853aca1357e7f0be48dd20655b3ccf9b2
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecbbb3d453288cb04c00832500daf83d8523ac5bb70fac12c4cc8afe8b509b58
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60843038c09890b3d3d4308da52dba8eb68941308164c7bde7754341b0a279b0
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.1.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45f3a94eed2e7b0b5d1ea41dfc1d2a8ba90f34a8786ece8b3c7e4f1a9af44735
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4384c7e250bb9c27df1f23bf7d02c516e889dc7b3df4f1359d33329edaffda07
3
+ size 42115
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6a12b0db3af2f44534830dcc00459f91a146994218c7ef086c630eadb007d81
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebe33798de7c4ed1e2c2e1320b8d5e67a6cf54a0da29af6fc25d5943a9d48652
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef23700cd60b094d66c1349d70015519e6805eed3c3620c94e645b20b3e60d70
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff0d3d40006f99d1225600c0ac74d166a33934df3a498103a77bfbec9dbde57a
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.10.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7c3a759535ede5933c7c2dfda3c73bd5fe36050db6cae327ce9d767529b08d0
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f9d4b8edfce047bff8eb35f0c63cb0812e9145f8405656ed944ff8edd02eb3c
3
+ size 42115
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e3f7ac4a0e9cc195404b3c17a29497ff2a9036d3ce97f84ebbfe210dea016e5
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8a3316b4121da1fd9d3278fc0ce0aa34bd8da7d7e83dc3d74966414c2ca34ae
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41f7a68e1be78c57378991c76ed05dfc6c29b1a4d44141f3e4ee5e653f46995c
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a304032973429320bc686c63ef871956bea05199d11d1b1bcbe11c724d0e059
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.11.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:680a1d9ef82e1f49fb9c520e0a361ce703a40e31363e2b2f45732138ad79c577
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5b27bb6ffd835351340168e078520372f392ccbc30f9ec57958e5aa6d1a1789
3
+ size 42115
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe55afa8dd8627870bebe298704fcaf07a2cf34e3f755e820cdf3aa2e05c7d62
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91f74a1d6300fb912066116ebe5d95ac5d5f59d1369d4b334bb0292c40752340
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1df1ae33d9de03b6c5316318064f2e7340925b27b38608638421d67f5c1d896
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5c3cea3e593a2e210b9b38b07fdcf7f812f40c79efae6acd9d3bb343b4c5b30
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.12.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775795afe8c4c7ed14a0eabaf4957d221e8ec59b7921acc861a4fc34aa685728
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa0b191f396dd832a7d16a75a325a1f64eecb1d6d0c22aedf1a2ad0acb945e4f
3
+ size 42115
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:745203ed2863f1e50072016b2712941ae79fb802ec2d13124f2cccb75ed6dc47
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e35957bb2a20e19d768c9ba0795cfffafa1e05d30928c7e8700b2ec9d1a9fe5
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd6809bc0a8f2485192c14cfc09ec224d77c07ad486806538b52d7e165b437bb
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4801ba22b2de8353c03baf1aea2bb97f4f5757c99f064b1423caf02bdf192d39
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.13.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebe9c182aca8ffa6d75c67eeedc08806ee5c5a5f7321c706df0cbb3553a018fa
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66affad8ad1de836d6087b088c07b768abe535b5a98c812f26af7075b2d2b6b6
3
+ size 42115
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:322de79962a032d926d35d6f9380435e0ffb16dc1337a49084ca889cb7fc0f8c
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d900d95ca7b73d582a36674461245af94b4a4d6148b4dc6b5c6623967d5d67da
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b28a701460bd664b4be219a2cd44a2a196f9869214a1c08457db61f0bd63372b
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b5801a3bc99a57158ba02aa4341e7018b056c30e16c0beb4e326be08ccb9568
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.14.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b824fc802ff0471fb690214ad359d2cb7eab5e9e31cd767a619469f8d732332
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d13331aa1a45f3a9b3297bca826009a0d8cbb1d8467b846df8283a58f3a1d17
3
+ size 42115
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7d5c6005139420bd5013eb8acaeed8d4ec450c0883fec578b191c8e97d6543d
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a77c3d37152492d6fc76088e529ac1cf6ad8787f6ef3a13abfa420311b8fa60
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea6f8e1b9bace5c3b28f55d21f15642cec9df0de018a0baab3875a76aac06555
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f730167b3ad0825f9c8b6e851ea66ce37c898e80b92e344fc1a5066521270a2f
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.15.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54ccfa66140011f5c15acc58853c1b374cf12df5ca8a340d9b280d767e309099
3
+ size 11395
params/phi/7/rnd_search_t_no_sched/comb_18/init/model.layers.16.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14a002caafff5008157ee6db61e65ebd594d275eb9a0f4cbc99c619af7f7451d
3
+ size 42115