Diogo-V commited on
Commit
8073e89
1 Parent(s): b1e4c9f

Adding more results

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/phi/8/ones_t/comb_8/init/lm_head/_0.pt +3 -0
  2. params/phi/8/ones_t/comb_8/init/lm_head/_s.pt +3 -0
  3. params/phi/8/ones_t/comb_8/init/model.layers.0.mlp.fc1/_0.pt +3 -0
  4. params/phi/8/ones_t/comb_8/init/model.layers.0.mlp.fc1/_s.pt +3 -0
  5. params/phi/8/ones_t/comb_8/init/model.layers.0.mlp.fc2/_0.pt +3 -0
  6. params/phi/8/ones_t/comb_8/init/model.layers.0.mlp.fc2/_s.pt +3 -0
  7. params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.dense/_0.pt +3 -0
  8. params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.dense/_s.pt +3 -0
  9. params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
  10. params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
  11. params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
  12. params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
  13. params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
  14. params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
  15. params/phi/8/ones_t/comb_8/init/model.layers.1.mlp.fc1/_0.pt +3 -0
  16. params/phi/8/ones_t/comb_8/init/model.layers.1.mlp.fc1/_s.pt +3 -0
  17. params/phi/8/ones_t/comb_8/init/model.layers.1.mlp.fc2/_0.pt +3 -0
  18. params/phi/8/ones_t/comb_8/init/model.layers.1.mlp.fc2/_s.pt +3 -0
  19. params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.dense/_0.pt +3 -0
  20. params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.dense/_s.pt +3 -0
  21. params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
  22. params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
  23. params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
  24. params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
  25. params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
  26. params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
  27. params/phi/8/ones_t/comb_8/init/model.layers.10.mlp.fc1/_0.pt +3 -0
  28. params/phi/8/ones_t/comb_8/init/model.layers.10.mlp.fc1/_s.pt +3 -0
  29. params/phi/8/ones_t/comb_8/init/model.layers.10.mlp.fc2/_0.pt +3 -0
  30. params/phi/8/ones_t/comb_8/init/model.layers.10.mlp.fc2/_s.pt +3 -0
  31. params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.dense/_0.pt +3 -0
  32. params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.dense/_s.pt +3 -0
  33. params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
  34. params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
  35. params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
  36. params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
  37. params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
  38. params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
  39. params/phi/8/ones_t/comb_8/init/model.layers.11.mlp.fc1/_0.pt +3 -0
  40. params/phi/8/ones_t/comb_8/init/model.layers.11.mlp.fc1/_s.pt +3 -0
  41. params/phi/8/ones_t/comb_8/init/model.layers.11.mlp.fc2/_0.pt +3 -0
  42. params/phi/8/ones_t/comb_8/init/model.layers.11.mlp.fc2/_s.pt +3 -0
  43. params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.dense/_0.pt +3 -0
  44. params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.dense/_s.pt +3 -0
  45. params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
  46. params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
  47. params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
  48. params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
  49. params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
  50. params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/8/ones_t/comb_8/init/lm_head/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
3
+ size 205955
params/phi/8/ones_t/comb_8/init/lm_head/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:422a4459bbb67a0bf7b85794c92662003a87c4d2616b6c4901d8913fd0fc8459
3
+ size 205955
params/phi/8/ones_t/comb_8/init/model.layers.0.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_8/init/model.layers.0.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed
3
+ size 42115
params/phi/8/ones_t/comb_8/init/model.layers.0.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.0.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.0.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.1.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_8/init/model.layers.1.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed
3
+ size 42115
params/phi/8/ones_t/comb_8/init/model.layers.1.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.1.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.1.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.10.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_8/init/model.layers.10.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed
3
+ size 42115
params/phi/8/ones_t/comb_8/init/model.layers.10.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.10.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.10.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.11.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_8/init/model.layers.11.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e81ec5b466c031f1efb52b483d7bab61b70eb2e4fe06704dbdddce21e55f84ed
3
+ size 42115
params/phi/8/ones_t/comb_8/init/model.layers.11.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.11.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_8/init/model.layers.11.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e265bc891ad21bad20193c00328207b279f78cba507ede5563f3cb2078851c0
3
+ size 11395