aapot commited on
Commit
dfb92c4
1 Parent(s): 9da74e0

Add 500k train step and HF flax model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoint_500000/checkpoint +3 -0
  2. checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
  3. checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
  4. checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  5. checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  6. checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  7. checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  8. checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  9. checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
  10. checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  11. checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  12. checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  13. checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
  14. checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  15. checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
  16. checkpoint_500000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  17. checkpoint_500000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  18. checkpoint_500000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  19. checkpoint_500000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 +3 -0
  20. checkpoint_500000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  21. checkpoint_500000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 +3 -0
  22. checkpoint_500000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  23. checkpoint_500000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  24. checkpoint_500000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  25. checkpoint_500000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 +3 -0
  26. checkpoint_500000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  27. checkpoint_500000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 +3 -0
  28. checkpoint_500000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  29. checkpoint_500000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  30. checkpoint_500000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  31. checkpoint_500000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 +3 -0
  32. checkpoint_500000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  33. checkpoint_500000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 +3 -0
  34. checkpoint_500000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  35. checkpoint_500000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  36. checkpoint_500000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  37. checkpoint_500000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 +3 -0
  38. checkpoint_500000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  39. checkpoint_500000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 +3 -0
  40. checkpoint_500000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  41. checkpoint_500000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  42. checkpoint_500000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  43. checkpoint_500000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 +3 -0
  44. checkpoint_500000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  45. checkpoint_500000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 +3 -0
  46. checkpoint_500000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  47. checkpoint_500000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  48. checkpoint_500000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  49. checkpoint_500000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 +3 -0
  50. checkpoint_500000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_500000/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c397311bf0313ee71b947ba36bd7f763d2943703776564773467396d8c3f524c
3
+ size 6520637
checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2269862cdedcdc3b1d80c61a1c305b4242b395d6fab667a9808ca9506d10598
3
+ size 2663
checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad7f3c9d5b03cab04e413775b8e77213fc37e8e92d58aed6366df34bc7df855d
3
+ size 2848
checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9e79b1c2e31996cecabc8f756bd1b1e62c1f51288d3c44dcfee4b1506ce35c0
3
+ size 2863
checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d2fc2564bfae125584d64fd5c62ae3e5cf18d9615864de9b204027da9f3629
3
+ size 2859
checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8e3c0e0683922bbf1882f4f4c418c68287ef3df331e920880a32716b5bd9b27
3
+ size 2825
checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1a585762755f2842efd498165974a171057662a8ade84d2025709f70da2955f
3
+ size 2855
checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fb07b004dd5db951c7664e3b7c4245f30ec87b870644ea94b80874b5e7e2fdb
3
+ size 2878
checkpoint_500000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47dc52144c27d8120e854d49dc4982d002c010747c388469a3f8811c622534d1
3
+ size 2859
checkpoint_500000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ab6a8119aa973d97cfcbcb96356ad7f3043131fd6e8d32d7621e1b42a7989eb
3
+ size 2866
checkpoint_500000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bc6f4ce4ccc1de626dcaedac277eeb2d59185cb56e74633b8b7bafc6991c632
3
+ size 2863
checkpoint_500000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:655c69538923f24cfc7fd42a2e5070631be176b2d147fb7ee1d9446b8dc0586c
3
+ size 2822
checkpoint_500000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d8faa2a3d98116571a0c9a6ed3efb4dae880cb10d7f9f5f0c3812433507fa9e
3
+ size 2841
checkpoint_500000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c835dbe4bc591d6b1370a97df295e1b994688e3c761aa51713f88b5da4e3ad82
3
+ size 2880
checkpoint_500000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d43b5bcb1216775173e61d82fdf951f4a4e1b2eed0268d1dd80eb3bfd28433e
3
+ size 2855
checkpoint_500000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ae0b5aa6b3aac5cc258e451dfa9de52061baf172a7a0cc7f848b873c1ff060c
3
+ size 2863
checkpoint_500000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7fdf37fbe34d94c07e759142e1067287a94e332f89319397cb50f3ff5fbee79
3
+ size 2852
checkpoint_500000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fccecf58c439a4d698ca909053159cfb456e9f55bd1197ad0dc7aeb91f07c1ae
3
+ size 2866
checkpoint_500000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cb3fcf36d28187eeacd86315cf049dad26b9d625e4aae01be7117b98e93ed50
3
+ size 2877
checkpoint_500000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f76f8e85b04b99cd5cc63023eec09549f740eadad1440b68ef7afdb48c28c339
3
+ size 2849
checkpoint_500000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ddbb71e204d53e060c8b9bf20f097a80b461d0792e3c4fa8a6fcad9c55280c0
3
+ size 2768
checkpoint_500000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a366187927da1471e390f7fa8f828fb6c311184b976b88c3f9a617b296e8687
3
+ size 2842
checkpoint_500000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e87ae558d06dbb837dc0e2a1483b46c951ef3a07a5909339ca1f406cb3fc6bf8
3
+ size 2897
checkpoint_500000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:201982a00c17b550085040b350072ad3ebdc5f694c9bf2020cdfc548096e5f82
3
+ size 2788
checkpoint_500000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32e3b6c2880651541cc4bf1448d7a41ca3e8dd35305f1e88051e57716c8f9f19
3
+ size 2833
checkpoint_500000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
3
+ size 168