Diogo-V commited on
Commit
f00c206
1 Parent(s): a3712a7

Adding more results

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/phi/8/ones_t/comb_12/init/lm_head/_0.pt +3 -0
  2. params/phi/8/ones_t/comb_12/init/lm_head/_s.pt +3 -0
  3. params/phi/8/ones_t/comb_12/init/model.layers.0.mlp.fc1/_0.pt +3 -0
  4. params/phi/8/ones_t/comb_12/init/model.layers.0.mlp.fc1/_s.pt +3 -0
  5. params/phi/8/ones_t/comb_12/init/model.layers.0.mlp.fc2/_0.pt +3 -0
  6. params/phi/8/ones_t/comb_12/init/model.layers.0.mlp.fc2/_s.pt +3 -0
  7. params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.dense/_0.pt +3 -0
  8. params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.dense/_s.pt +3 -0
  9. params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
  10. params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
  11. params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
  12. params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
  13. params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
  14. params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
  15. params/phi/8/ones_t/comb_12/init/model.layers.1.mlp.fc1/_0.pt +3 -0
  16. params/phi/8/ones_t/comb_12/init/model.layers.1.mlp.fc1/_s.pt +3 -0
  17. params/phi/8/ones_t/comb_12/init/model.layers.1.mlp.fc2/_0.pt +3 -0
  18. params/phi/8/ones_t/comb_12/init/model.layers.1.mlp.fc2/_s.pt +3 -0
  19. params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.dense/_0.pt +3 -0
  20. params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.dense/_s.pt +3 -0
  21. params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
  22. params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
  23. params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
  24. params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
  25. params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
  26. params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
  27. params/phi/8/ones_t/comb_12/init/model.layers.10.mlp.fc1/_0.pt +3 -0
  28. params/phi/8/ones_t/comb_12/init/model.layers.10.mlp.fc1/_s.pt +3 -0
  29. params/phi/8/ones_t/comb_12/init/model.layers.10.mlp.fc2/_0.pt +3 -0
  30. params/phi/8/ones_t/comb_12/init/model.layers.10.mlp.fc2/_s.pt +3 -0
  31. params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.dense/_0.pt +3 -0
  32. params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.dense/_s.pt +3 -0
  33. params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
  34. params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
  35. params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
  36. params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
  37. params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
  38. params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
  39. params/phi/8/ones_t/comb_12/init/model.layers.11.mlp.fc1/_0.pt +3 -0
  40. params/phi/8/ones_t/comb_12/init/model.layers.11.mlp.fc1/_s.pt +3 -0
  41. params/phi/8/ones_t/comb_12/init/model.layers.11.mlp.fc2/_0.pt +3 -0
  42. params/phi/8/ones_t/comb_12/init/model.layers.11.mlp.fc2/_s.pt +3 -0
  43. params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.dense/_0.pt +3 -0
  44. params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.dense/_s.pt +3 -0
  45. params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
  46. params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
  47. params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
  48. params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
  49. params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
  50. params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/8/ones_t/comb_12/init/lm_head/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
3
+ size 205955
params/phi/8/ones_t/comb_12/init/lm_head/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d439ef059780596ad9d456e2ee60e37c3210a0069afc0cb2ab825c93b511e07c
3
+ size 205955
params/phi/8/ones_t/comb_12/init/model.layers.0.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_12/init/model.layers.0.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02d9e1b8621d5434eab438d59d7773ea638670c294ed2b90d268f9bdaebeba42
3
+ size 42115
params/phi/8/ones_t/comb_12/init/model.layers.0.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.0.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:878ab3145ec7db0aef7b479689b120aa096a3dd4ac7a9540768a89562afc188b
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2708e3dfa3e9c0dd5ca53b01efdcc70247030ddd2d230807e6c1eb8b685bac0
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1113269e0790f1648074beb8ea5eca9e22679a8674deef3a8fbfbf8fb9eb978c
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:915f78a6092cf6f8d60cff493f0e6f7f805fbd784e03d90c198d826862c0c760
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16261484a671df104fbc657988ae81e0fb533690b9a5d83ae08c54813cf46e8b
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.1.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_12/init/model.layers.1.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65b25dcbb22dc17b231d9c779df53e0a96248786a3135901b3a26f4e57daa8b6
3
+ size 42115
params/phi/8/ones_t/comb_12/init/model.layers.1.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.1.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:867d2d71d9548dcdeca47965044476357a8c56460fdecf6eb011aea0e924958a
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ebbcd50c20e396a5743c6d524f77eccd986e700d740ff4ced5b5d47b51993f0
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b944edcb5043be7b91cc868417131ae6c1b661a0cc1d020626d0cf95c7d54bab
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e1b01bd29981ce7e940a50fed50e3c86a3e157e6e233f539d4bd25ce34090f1
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51d779c10d616c2607535e2038882c66aa45980b6fc5b4dc90eb858e2f190536
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.10.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_12/init/model.layers.10.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1e587d3abd7be00c3d8b3ba8fadef3bd30865d8804d754e777ac747e4f8c8e4
3
+ size 42115
params/phi/8/ones_t/comb_12/init/model.layers.10.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.10.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac61d30530b00de25b0fd5f943561c36764ea8b2504c30140fa10fc4aa0f0634
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7be0202026e4b14d5e6f6c6fdc290e6fac2e222db1bb909f725a69f297fb05d
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da4f77473e588432f4e7d307dbfefa869d770a0a10876188c5df7485f932d772
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cecee159ce61a983b2c7496668b36c2c2e47141892b45b08450e8a457fb9ac6
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95582952b08713e8757ec74a1eee52744085589fe4894deff166fece14e1499d
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.11.mlp.fc1/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
3
+ size 42115
params/phi/8/ones_t/comb_12/init/model.layers.11.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40f14e644eeed920065fc290cc06c44717e6abd381dd9f47817a6f022b3dd50d
3
+ size 42115
params/phi/8/ones_t/comb_12/init/model.layers.11.mlp.fc2/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.11.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bbee1a235d05667ea42426bcefbe1f0d836cd80aa278661b2c82e803afd4e45
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.dense/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40bac8b07fadc8bdde107e80953b031d3102eacbccf2bcd54dedc5840970679a
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54872d3d5a5460da3b870e02537044a9fadbb86dd855778b98721d66f57915d3
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26f90fb808d7b92529275823f19f55498f87039f8421814643ec54f4c239261b
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
3
+ size 11395
params/phi/8/ones_t/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5bdfcc7f4eff6b574b4071580826f343705496ffce7863c5330516c7fca0134
3
+ size 11395