Diogo-V commited on
Commit
4c85fee
1 Parent(s): f00c206

Adding more results

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. params/phi/8/ones_t/comb_13/init/lm_head/_s.pt +3 -0
  2. params/phi/8/ones_t/comb_13/init/model.layers.0.mlp.fc1/_s.pt +3 -0
  3. params/phi/8/ones_t/comb_13/init/model.layers.0.mlp.fc2/_s.pt +3 -0
  4. params/phi/8/ones_t/comb_13/init/model.layers.0.self_attn.dense/_s.pt +3 -0
  5. params/phi/8/ones_t/comb_13/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
  6. params/phi/8/ones_t/comb_13/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
  7. params/phi/8/ones_t/comb_13/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
  8. params/phi/8/ones_t/comb_13/init/model.layers.1.mlp.fc1/_s.pt +3 -0
  9. params/phi/8/ones_t/comb_13/init/model.layers.1.mlp.fc2/_s.pt +3 -0
  10. params/phi/8/ones_t/comb_13/init/model.layers.1.self_attn.dense/_s.pt +3 -0
  11. params/phi/8/ones_t/comb_13/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
  12. params/phi/8/ones_t/comb_13/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
  13. params/phi/8/ones_t/comb_13/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
  14. params/phi/8/ones_t/comb_13/init/model.layers.10.mlp.fc1/_s.pt +3 -0
  15. params/phi/8/ones_t/comb_13/init/model.layers.10.mlp.fc2/_s.pt +3 -0
  16. params/phi/8/ones_t/comb_13/init/model.layers.10.self_attn.dense/_s.pt +3 -0
  17. params/phi/8/ones_t/comb_13/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
  18. params/phi/8/ones_t/comb_13/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
  19. params/phi/8/ones_t/comb_13/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
  20. params/phi/8/ones_t/comb_13/init/model.layers.11.mlp.fc1/_s.pt +3 -0
  21. params/phi/8/ones_t/comb_13/init/model.layers.11.mlp.fc2/_s.pt +3 -0
  22. params/phi/8/ones_t/comb_13/init/model.layers.11.self_attn.dense/_s.pt +3 -0
  23. params/phi/8/ones_t/comb_13/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
  24. params/phi/8/ones_t/comb_13/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
  25. params/phi/8/ones_t/comb_13/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
  26. params/phi/8/ones_t/comb_13/init/model.layers.12.mlp.fc1/_s.pt +3 -0
  27. params/phi/8/ones_t/comb_13/init/model.layers.12.mlp.fc2/_s.pt +3 -0
  28. params/phi/8/ones_t/comb_13/init/model.layers.12.self_attn.dense/_s.pt +3 -0
  29. params/phi/8/ones_t/comb_13/init/model.layers.12.self_attn.k_proj/_s.pt +3 -0
  30. params/phi/8/ones_t/comb_13/init/model.layers.12.self_attn.q_proj/_s.pt +3 -0
  31. params/phi/8/ones_t/comb_13/init/model.layers.12.self_attn.v_proj/_s.pt +3 -0
  32. params/phi/8/ones_t/comb_13/init/model.layers.13.mlp.fc1/_s.pt +3 -0
  33. params/phi/8/ones_t/comb_13/init/model.layers.13.mlp.fc2/_s.pt +3 -0
  34. params/phi/8/ones_t/comb_13/init/model.layers.13.self_attn.dense/_s.pt +3 -0
  35. params/phi/8/ones_t/comb_13/init/model.layers.13.self_attn.k_proj/_s.pt +3 -0
  36. params/phi/8/ones_t/comb_13/init/model.layers.13.self_attn.q_proj/_s.pt +3 -0
  37. params/phi/8/ones_t/comb_13/init/model.layers.13.self_attn.v_proj/_s.pt +3 -0
  38. params/phi/8/ones_t/comb_13/init/model.layers.14.mlp.fc1/_s.pt +3 -0
  39. params/phi/8/ones_t/comb_13/init/model.layers.14.mlp.fc2/_s.pt +3 -0
  40. params/phi/8/ones_t/comb_13/init/model.layers.14.self_attn.dense/_s.pt +3 -0
  41. params/phi/8/ones_t/comb_13/init/model.layers.14.self_attn.k_proj/_s.pt +3 -0
  42. params/phi/8/ones_t/comb_13/init/model.layers.14.self_attn.q_proj/_s.pt +3 -0
  43. params/phi/8/ones_t/comb_13/init/model.layers.14.self_attn.v_proj/_s.pt +3 -0
  44. params/phi/8/ones_t/comb_13/init/model.layers.15.mlp.fc1/_s.pt +3 -0
  45. params/phi/8/ones_t/comb_13/init/model.layers.15.mlp.fc2/_s.pt +3 -0
  46. params/phi/8/ones_t/comb_13/init/model.layers.15.self_attn.dense/_s.pt +3 -0
  47. params/phi/8/ones_t/comb_13/init/model.layers.15.self_attn.k_proj/_s.pt +3 -0
  48. params/phi/8/ones_t/comb_13/init/model.layers.15.self_attn.q_proj/_s.pt +3 -0
  49. params/phi/8/ones_t/comb_13/init/model.layers.15.self_attn.v_proj/_s.pt +3 -0
  50. params/phi/8/ones_t/comb_13/init/model.layers.16.mlp.fc1/_s.pt +3 -0
params/phi/8/ones_t/comb_13/init/lm_head/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0613c5da1d73e707f7537ab833432f9bf4d0e331d2790ad56ecf3f90f066c949
3
+ size 205955
params/phi/8/ones_t/comb_13/init/model.layers.0.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22dd0637f1f26f4b1c1e5389ebd5b8c4e34408dad0dfc969f434246224551fd4
3
+ size 42115
params/phi/8/ones_t/comb_13/init/model.layers.0.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d4725a842b07e1bbe736228771eb92e875fc923b353823c5124ff03c72a8019
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.0.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e667894e9bfa6d2f2e897642ae68bacd0516430957415bd15db1dfbbe89792a
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.0.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfb98f9165c78d24316cbb5d13b0bea986191ea71e376120f78998b8e0dcc3fc
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.0.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93c9b64a4f02e091ac587173b8a1af4490cf86353289ac92332445128f9b8154
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.0.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e1a3db66c95603806ab016e9d29a887ebbcdfa6de0686b9e577da36bb781cf7
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.1.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:543355d9f167b7058fed5164238738abf98555ad015c080d5ecae9dba058d092
3
+ size 42115
params/phi/8/ones_t/comb_13/init/model.layers.1.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0108a2a4d791b9a85d3a67cdf2f2294c3313a060c0b4f19363fea12bf39ba111
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.1.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05fc40c20b2af3943a43e3fa2444aa47414ab7fcec4ab1041a8b2bdd2239ed03
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.1.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fa274a19a7f01649d2a33ed0f360608dfdba1a94b5d8e9a9003aada3787ad28
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.1.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fc49e9f79fa5a8c4e62f2f2614ba1f70ca681fd0860f3f4b3a7a53c431148ae
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.1.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dad7ed56e9e635880f4cd2c48e2a912e7900a96148202ac7cb527578ee661676
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.10.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2744063fec7a3a901708bd27dac21faeaa38f9813a1f5442d21b6e9ab388dd5b
3
+ size 42115
params/phi/8/ones_t/comb_13/init/model.layers.10.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f72996c1e9cc61945d8a43da324812a67372cc6156188d872a232e8f6c88f447
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.10.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac19c9cb0d4598a4e5430253890f612612120b2ffc37dcd8d16c792df8067893
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.10.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25e7f973937a125e51344541f5ac8ba4ae6e9fd73271a325bd652f7d11a6d3d8
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.10.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f3325a089fe9f65f55a5811b4685f99cf4cd6482c493868075f6ace2b6ae2e1
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.10.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c41d20566e8aeac8700f3ce81e0710bc76aa0b8771035969dc2c5ee1f3863ff9
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.11.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fde3a4385e3abd353afb8177f9e416501ef80b634c2c9299049d8ba3faf1e178
3
+ size 42115
params/phi/8/ones_t/comb_13/init/model.layers.11.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af1faba0083d93476ca31ee820e2422d7331bc8df8ea7fbbb18adc4769ea5545
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.11.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a19488415b1256c66024a7ab923924cea3189b5b9218672ddc8e84404a8f00c
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.11.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb6ad6b51f6437312d72ee1250430a2e6370d68eb94883659ea244744be8d4f4
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.11.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a303939dc50c64b8c4896502008bc6df8053f0446a96f494ae0a7935fecd639
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.11.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94dae00e7f65e8f709a0b17e3d4c731fba924583bdd100f008fd3eb60bd11674
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.12.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf9b1155f5088616fecaa96847f2796d2f162c4314c58ea4ea957d5aa6aff57b
3
+ size 42115
params/phi/8/ones_t/comb_13/init/model.layers.12.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8642ae0618d97138851680c72bf025445ec5f18bac7e790183a04b66c028c87
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.12.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:797e787b6a03a9f45778e46aea957aa1d7818a82e5337d6659d953f82ff3ab49
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.12.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40015033efab24921f0fa3bef686b9b0c49e9e6cada85a9e48c7be3cab56fa07
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.12.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96af2fcced4ba621def7b2cf63a9361f5392b8573372674afb500bd49a90f5bd
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.12.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4e614966309b505bbe72b8a283c84e4e9eae3f1ac884cae55d34d512b67856c
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.13.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b03e1f1cabf9d44a774d00523a9630e88372be0f47c418a7893065626e68e45
3
+ size 42115
params/phi/8/ones_t/comb_13/init/model.layers.13.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5843dc60b99fe07f829a09799256dedde65e6fe0b52c43ceae1740068ff6243a
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.13.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba36306ed9cb03f400ffc2c4d7473eb408eba79823eac86578d5f2e18ada018e
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.13.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:522112dd952c42c219d25cb25ddd26e3a1761758f197bb4532bbc5be5a9c5331
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.13.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adbf879e9042ca074e1a8ba3cc5a5d1756616c133e5ab59135b457d3936117ce
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.13.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f285548d9c6dc24eca2a5ac2bef372eb52055906685c3268494fbd54e13b0507
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.14.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6878875c71ff5a84591e1386323e0556ff5c59a59e6cf85bd6f7e254bcff0756
3
+ size 42115
params/phi/8/ones_t/comb_13/init/model.layers.14.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d6a9b4bde1669169451ee2eaf86b7f32abb773e5a2b7a461f9f6c7f6fca3b11
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.14.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:217dac1b20db280e25fe20099303da8aef9003d01e8a2e627a5e7333b7943aa1
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.14.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aebe9b2d5423698f95e46c7d18d90bf2f8268828032ff737aa2f11b18e3c2d1b
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.14.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a5359d0683e15e934b9e6d8caf88876f9eec373510381d389c7c230a6231278
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.14.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b8fdffa6b60fa3408490632cb8f85866ce6fa047472020879b4bf7c42d39ae4
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.15.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c3b2f227e4da1867db81ccdd53a3f268b4b4a766189a344f2c820f160d29670
3
+ size 42115
params/phi/8/ones_t/comb_13/init/model.layers.15.mlp.fc2/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8da8a6346a0f28896b4720432925b00f03d225227e0247d390f40ee5db7d13a6
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.15.self_attn.dense/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bb01f536b3eddef5b2459183ae18a4de36d91bf39525fc20e055394bcbe4ca6
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.15.self_attn.k_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a320a632e4e70690833abafcf055a1c67953106be4fa4b30e9b28f9cf7f34283
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.15.self_attn.q_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e77ace907dd4ac1b36ea02bb068dc24c8e13d1f6d372e7b7cc4765c7ee2e5ddc
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.15.self_attn.v_proj/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dc346e7dabed1d99240a0cfcd18c364b8da8a4101ac2c760555495573c18f6c
3
+ size 11395
params/phi/8/ones_t/comb_13/init/model.layers.16.mlp.fc1/_s.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2189338494a9bff0538b9128674574ab4b544bc5f0873f6d6a7efd11bf0e7b1
3
+ size 42115