aapot committed on
Commit
ef33930
1 Parent(s): 7f944aa

Add 500k train step and HF flax model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoint_500000/checkpoint +3 -0
  2. checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
  3. checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
  4. checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  5. checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  6. checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  7. checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  8. checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  9. checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
  10. checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  11. checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  12. checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  13. checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
  14. checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  15. checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
  16. checkpoint_500000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  17. checkpoint_500000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  18. checkpoint_500000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  19. checkpoint_500000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 +3 -0
  20. checkpoint_500000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  21. checkpoint_500000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 +3 -0
  22. checkpoint_500000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  23. checkpoint_500000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  24. checkpoint_500000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  25. checkpoint_500000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +3 -0
  26. checkpoint_500000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  27. checkpoint_500000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +3 -0
  28. checkpoint_500000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  29. checkpoint_500000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  30. checkpoint_500000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  31. checkpoint_500000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 +3 -0
  32. checkpoint_500000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  33. checkpoint_500000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 +3 -0
  34. checkpoint_500000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  35. checkpoint_500000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  36. checkpoint_500000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  37. checkpoint_500000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +3 -0
  38. checkpoint_500000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  39. checkpoint_500000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +3 -0
  40. checkpoint_500000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray +3 -0
  41. checkpoint_500000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 +3 -0
  42. checkpoint_500000/state.param_states.encoder.encoder_norm.scale.v/.zarray +3 -0
  43. checkpoint_500000/state.param_states.encoder.encoder_norm.scale.v/0 +3 -0
  44. checkpoint_500000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray +3 -0
  45. checkpoint_500000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 +3 -0
  46. checkpoint_500000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  47. checkpoint_500000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  48. checkpoint_500000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray +3 -0
  49. checkpoint_500000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0 +3 -0
  50. checkpoint_500000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
checkpoint_500000/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4873466081ff7f11f6f484a2291de99e0b78667b384ae71d228735e2f6d208b
3
+ size 640339
checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4757fbb41a5f3b04f2ba3df2a7573932532fb4977030819d01cbdda4d8d5334
3
+ size 959
checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35df72b5ce24be102dad91b61e0d71ce817fd18c2b606c58fc7afcbcbf0d5c84
3
+ size 981
checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c752b12095d6e2beab1e15487e9ffa3cf081b2bc92f5e39ab7b3e26cf4ebbb90
3
+ size 964
checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad9cf86894cdf51c0fdbbcb0de49270ec66628949b4c63a8a94129449f9467fe
3
+ size 990
checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a57215f0f6883b5610a6b8f3834035b0499c86da8cc9145f5c209b35b0c4361
3
+ size 983
checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb1f74d468062ae9d448759cde8d3ba5062e094450b6bdb53e9e37bc4fc73220
3
+ size 978
checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57628356878c1af1713f805422f5eb0eea942df9cd09227bc5d10aca64a15ba1
3
+ size 999
checkpoint_500000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_2.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84b1ee6fac4232600776045ed0131ffb3bf1dcb37c608e6beedd321e6524e193
3
+ size 976
checkpoint_500000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_2.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d18bce9293a4836b74725eb793727003191e2213feeddc480859fe4224c4ea6
3
+ size 969
checkpoint_500000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_2.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cf6362db3bc23024882ae85c0410f8d81d4febf413fd4bf2263c3a10c039454
3
+ size 984
checkpoint_500000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_3.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7de94bfad05f55d25c0acd083b1156da4045358b3dbc56a3939388715ab6e9f1
3
+ size 964
checkpoint_500000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_3.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51d21994aeaa68818ca620b77202e1f4a3930a921c52466c9d32817366ff3075
3
+ size 955
checkpoint_500000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b18495b05766fb5979e7e2b25fa733f5de7cf697371a88a0b9832ba5a88bce7
3
+ size 978
checkpoint_500000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_4.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3e4800347edf69708a2526028710845bf3cb6fa0427d28e0756f41c8ffe3fdc
3
+ size 976
checkpoint_500000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_4.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05ac892b97782be94128d15a52d50b125fab135ce9904698f89063c354295145
3
+ size 960
checkpoint_500000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_4.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7165b17eb33ea12bbff9e82525a3a8849c55e8dd697dc53aca897fcd187e9f81
3
+ size 979
checkpoint_500000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_5.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ee6e807e3e759b7285333266bf747dae6541e603299c8b9fc249e403e626f5c
3
+ size 983
checkpoint_500000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_5.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e5939aea44e6420737bc7137f1349569f36d40739a61fce33125b03a8d4e356
3
+ size 981
checkpoint_500000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57836882c1824d7ae56668dd502c3f265dcdd21209794f85a0abf2325de181f7
3
+ size 963
checkpoint_500000/state.param_states.decoder.relpos_bias.rel_embedding.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29b0b4f4727db7bbeacbac66511f4e0ea2d73d7e962302934561781052f7e5c3
3
+ size 170
checkpoint_500000/state.param_states.decoder.relpos_bias.rel_embedding.v/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1756cfcb9f1960f815f865cf3031323ed1c58d78a119efcc233a8fe8cd57d70
3
+ size 535
checkpoint_500000/state.param_states.encoder.encoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.encoder.encoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a31d466a081bf453647a2dfa6de6638d8712d15a359856d0b21d045bda4c076
3
+ size 988
checkpoint_500000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.encoder.layers_0.pre_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06bf96f74d0fb72aee2ab4529da7d6a413b9f6d9f0a94b504cca72678667ce1a
3
+ size 950
checkpoint_500000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.encoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ffb5d0490ef73897bdd72596869cdd73babb18c6325b580e271d961737d1f7a
3
+ size 966
checkpoint_500000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168
checkpoint_500000/state.param_states.encoder.layers_1.pre_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e1d03a6ec5f9d7f30e39b0dc985475c60eaab99c3be24ca58fd41b55317b020
3
+ size 968
checkpoint_500000/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b8d96750cc3cb29fdf9654317e87644d16122c4608cd0e0ef63723aa2aee992
3
+ size 168