Diogo-V commited on
Commit
1901a41
1 Parent(s): 4c85fee

Adding more results

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/phi/8/ones_t/comb_14/init/lm_head/_0.pt +3 -0
  2. params/phi/8/ones_t/comb_14/init/lm_head/_s.pt +3 -0
  3. params/phi/8/ones_t/comb_14/init/model.layers.0.mlp.fc1/_0.pt +3 -0
  4. params/phi/8/ones_t/comb_14/init/model.layers.0.mlp.fc1/_s.pt +3 -0
  5. params/phi/8/ones_t/comb_14/init/model.layers.0.mlp.fc2/_0.pt +3 -0
  6. params/phi/8/ones_t/comb_14/init/model.layers.0.mlp.fc2/_s.pt +3 -0
  7. params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.dense/_0.pt +3 -0
  8. params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.dense/_s.pt +3 -0
  9. params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
  10. params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
  11. params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
  12. params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
  13. params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
  14. params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
  15. params/phi/8/ones_t/comb_14/init/model.layers.1.mlp.fc1/_0.pt +3 -0
  16. params/phi/8/ones_t/comb_14/init/model.layers.1.mlp.fc1/_s.pt +3 -0
  17. params/phi/8/ones_t/comb_14/init/model.layers.1.mlp.fc2/_0.pt +3 -0
  18. params/phi/8/ones_t/comb_14/init/model.layers.1.mlp.fc2/_s.pt +3 -0
  19. params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.dense/_0.pt +3 -0
  20. params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.dense/_s.pt +3 -0
  21. params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
  22. params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
  23. params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
  24. params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
  25. params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
  26. params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
  27. params/phi/8/ones_t/comb_14/init/model.layers.10.mlp.fc1/_0.pt +3 -0
  28. params/phi/8/ones_t/comb_14/init/model.layers.10.mlp.fc1/_s.pt +3 -0
  29. params/phi/8/ones_t/comb_14/init/model.layers.10.mlp.fc2/_0.pt +3 -0
  30. params/phi/8/ones_t/comb_14/init/model.layers.10.mlp.fc2/_s.pt +3 -0
  31. params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.dense/_0.pt +3 -0
  32. params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.dense/_s.pt +3 -0
  33. params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
  34. params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
  35. params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
  36. params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
  37. params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
  38. params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
  39. params/phi/8/ones_t/comb_14/init/model.layers.11.mlp.fc1/_0.pt +3 -0
  40. params/phi/8/ones_t/comb_14/init/model.layers.11.mlp.fc1/_s.pt +3 -0
  41. params/phi/8/ones_t/comb_14/init/model.layers.11.mlp.fc2/_0.pt +3 -0
  42. params/phi/8/ones_t/comb_14/init/model.layers.11.mlp.fc2/_s.pt +3 -0
  43. params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.dense/_0.pt +3 -0
  44. params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.dense/_s.pt +3 -0
  45. params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
  46. params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
  47. params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
  48. params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
  49. params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
  50. params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/8/ones_t/comb_14/init/lm_head/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
3
+ size 205955
params/phi/8/ones_t/comb_14/init/lm_head/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a9511da3b259146ff19c2420c69b2e6b9bf77e72155c8025770bd97a174219a
3
+ size 205955
params/phi/8/ones_t/comb_14/init/model.layers.0.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_14/init/model.layers.0.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b59cf216aebacd3d79b358eba73f0fbb3fbf1ce5bf0354479353e0e05100281
3
+ size 42115
params/phi/8/ones_t/comb_14/init/model.layers.0.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.0.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:621ecaa46bb5198e7a987cb0556a44c47d6349e0051c7c75f0aba6a5fb523daa
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:deb59f3acb343f52c7c12c18be23790ae09bfb88503b0f5148ebfd40d1624fc7
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23f740c4915269d0bcd6aa75850aa529b3f4a7e070b930b19ac6073ee2babb0d
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e704537c6a4d2ba564653745d1c5c95905220aea812f819a836c5cf8b259600f
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44fe1cab3a6b427cd007a8aea0e70ba4869b1d97ed4a5d09bfef82f43c8aade6
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.1.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_14/init/model.layers.1.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad9ef3a2459fba851d22094be890a7aef5b26af9ce3abb3a3b1450db85adcc38
3
+ size 42115
params/phi/8/ones_t/comb_14/init/model.layers.1.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.1.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:829d15baa9b5d2c223382f194cd7cce4269848ba1113284c674ba7e93d00d235
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c89560ad1aa5769e990aef7d8dff7ded07f90a1b99ffe1734166c9fb967c9b8
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05d79124bb599224870df4adf324d36d12b193ff887bdde6614fc32530501f62
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91436fa7b095e225f8690274a5da65769c3dffde4a921deab5a47d641907a55e
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d7a412c6cae6c96abab4d8034777cfe6ca9dcb881114a42a5398e62fbb679be
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.10.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_14/init/model.layers.10.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56417683286fc762a110c6680a25c30dc81bfa83b207aace421a7c3fd5d20403
3
+ size 42115
params/phi/8/ones_t/comb_14/init/model.layers.10.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.10.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b80fde81daec10870846379b85a20fbf14351c2566ee10d3aea632f1a3e6882
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a31c0af8e6e62ac12000b96481acd118748d1c1a6f53bc5ce2e665ee33dd3b1
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3652005e2d2f30c898e52098a545eb07e8be5172e32d56dd566b02e677533a7c
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5ded6a8420766b76c9663348c4056b01f0c73a2c663eb12b3b381be514cff55
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc817a86a39a96580552480752248435479a8f456ab3ac322d05a3284b62ba8b
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.11.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_14/init/model.layers.11.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efd78ca0a375b4ca306a83b6cc1d1cc8509c05c20939da0ef07e2d4fd012c273
3
+ size 42115
params/phi/8/ones_t/comb_14/init/model.layers.11.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.11.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e6204592a517d45785f750f730c8796dec0bf196d3f812222c8b927912d627e
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ea5536a40de7592a3cd462b1ce7ab52427872ba8994908c0998b786a788a1cf
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5c81d7758609ec1b7574e385dee2077e0d4e79da56089c9755f752e9f078d0a
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9c8f5a654afa4807110980996f711bbf6a90d8a2e39a930cbca6a7a509a9fdf
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23f530db255cf20ade993c3b503b9b52a1c1bd6817615b8d18d883496284dd8b
3
+ size 11395