aapot commited on
Commit
bad1e66
1 Parent(s): 3bc5dc7

Add 1100k train step and HF flax model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoint_1100000/checkpoint +3 -0
  2. checkpoint_1100000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
  3. checkpoint_1100000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
  4. checkpoint_1100000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  5. checkpoint_1100000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  6. checkpoint_1100000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  7. checkpoint_1100000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  8. checkpoint_1100000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  9. checkpoint_1100000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
  10. checkpoint_1100000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  11. checkpoint_1100000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  12. checkpoint_1100000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  13. checkpoint_1100000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
  14. checkpoint_1100000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  15. checkpoint_1100000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
  16. checkpoint_1100000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  17. checkpoint_1100000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  18. checkpoint_1100000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  19. checkpoint_1100000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 +3 -0
  20. checkpoint_1100000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  21. checkpoint_1100000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 +3 -0
  22. checkpoint_1100000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  23. checkpoint_1100000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  24. checkpoint_1100000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  25. checkpoint_1100000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 +3 -0
  26. checkpoint_1100000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  27. checkpoint_1100000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 +3 -0
  28. checkpoint_1100000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  29. checkpoint_1100000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  30. checkpoint_1100000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  31. checkpoint_1100000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 +3 -0
  32. checkpoint_1100000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  33. checkpoint_1100000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 +3 -0
  34. checkpoint_1100000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  35. checkpoint_1100000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  36. checkpoint_1100000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  37. checkpoint_1100000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 +3 -0
  38. checkpoint_1100000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  39. checkpoint_1100000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 +3 -0
  40. checkpoint_1100000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  41. checkpoint_1100000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  42. checkpoint_1100000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  43. checkpoint_1100000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 +3 -0
  44. checkpoint_1100000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  45. checkpoint_1100000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 +3 -0
  46. checkpoint_1100000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  47. checkpoint_1100000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  48. checkpoint_1100000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  49. checkpoint_1100000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 +3 -0
  50. checkpoint_1100000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_1100000/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1a4f7eaf2c99e3eda5a859f877038252b40b890393385d1c4d0dd59f6c62cfb
3
+ size 8513341
checkpoint_1100000/state.param_states.decoder.decoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.decoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c92723d8427e9c724d3c51264362cb8a0b7cc2e595ca3242ede50e6d321b3ec4
3
+ size 3683
checkpoint_1100000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30e98d8275db1e77d7a2d430c067e0cbc535581d812b71b90cbfbb63b2500a19
3
+ size 3663
checkpoint_1100000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a5e96bd9da2ca50a1b8971a472e6db343f8f62da2aaa31c342f5d8484f305ec
3
+ size 3441
checkpoint_1100000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6d04c30d2861180da47c41b9ff17a028bf22db10766985a09f333f1e9005cc8
3
+ size 3572
checkpoint_1100000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4baf9c64a05bdd39b79cfe18ffd38c07be896728520c7cd3f5ee1bb46b9fefe1
3
+ size 3587
checkpoint_1100000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:719ccfcffabcae371f8a0052d469e5ddf15f4eeb845f4fc47d6c64e8eea25a83
3
+ size 3490
checkpoint_1100000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec20682446566c1ae3368d334149042d1ed1808d0cbcab646be6e3f04431a2c0
3
+ size 3703
checkpoint_1100000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f63aaa6cf721c40744b4872d4d996ffc73384d9de3ac360cf10f2d19a5367919
3
+ size 3617
checkpoint_1100000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56dfa17d7b2287d35dfe031ab3ac4ba94899b5b3fc646408de92c98c1281e411
3
+ size 3643
checkpoint_1100000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c24bbeb81b042b027151404618ba413a55e00c8b96468f2c3d29635260c701c2
3
+ size 3686
checkpoint_1100000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eee29ac6024fca134b9055eb0ad5185427bd084b654ea1c03dc7375dcac813a7
3
+ size 3600
checkpoint_1100000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67f73ae5fbb5b1ce12823243ac5222f04bce1bd53db3e47a78cce6b04baa5b8c
3
+ size 3643
checkpoint_1100000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:906575ea71e199ce21ac288ebaa62a4d9ab8775421e2f292b355c5dc11fc94c6
3
+ size 3583
checkpoint_1100000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0282eaa53de586ca15441fe97c4cdcb4735eacf4c08e745e60adeab948dabb97
3
+ size 3666
checkpoint_1100000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85a94ec4c32ce81d6a6f1bb0203d61da7b5a75f280de0a60cf14c9555a5639c4
3
+ size 3643
checkpoint_1100000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d789057f839ee716f8e3bed837cb3f55dd26909ece04b1f830aa80a97fc3596
3
+ size 3600
checkpoint_1100000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7eb5a9cf9b7eab93e1e385940c74f8ed6c1f160bf1f76f132067912775abb216
3
+ size 3637
checkpoint_1100000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78bc3d6f87d109af72c46b2f6905aeab4a3ca7eedf81d4665d7cdccd8b8f71d0
3
+ size 3638
checkpoint_1100000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa2fab69d2f9ec00b199994cb0d6405682e83e61dc9254f036b52e59c549d97d
3
+ size 3656
checkpoint_1100000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db77059448024588d68777ce3a02780f0632695d294c9e85507b64e567e09bb0
3
+ size 3585
checkpoint_1100000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3a85a53e32ea4a9ece175cca780088613574f3c5ef62f42bb770cb8e5a17957
3
+ size 3635
checkpoint_1100000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7704a920f4f2e0deb1eeb1960add5a841e806edd05f40297ae8644cd38bc24e4
3
+ size 3587
checkpoint_1100000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12284b62435755be86e5cbd455d9d3f3e862f93c665a0c88dbdd4a926dc9b7df
3
+ size 3668
checkpoint_1100000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_1100000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ed03bd64320c9a73d7c777cab3333f8fd2e5c60509834c6eeff8a45734a7505
3
+ size 3596
checkpoint_1100000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170