aapot commited on
Commit
94f7aaa
1 Parent(s): ec4e3f3

Add 200k train step and HF flax model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoint_200000/checkpoint +3 -0
  2. checkpoint_200000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
  3. checkpoint_200000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
  4. checkpoint_200000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  5. checkpoint_200000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  6. checkpoint_200000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  7. checkpoint_200000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  8. checkpoint_200000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  9. checkpoint_200000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
  10. checkpoint_200000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  11. checkpoint_200000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  12. checkpoint_200000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  13. checkpoint_200000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
  14. checkpoint_200000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  15. checkpoint_200000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
  16. checkpoint_200000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  17. checkpoint_200000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  18. checkpoint_200000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  19. checkpoint_200000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 +3 -0
  20. checkpoint_200000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  21. checkpoint_200000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 +3 -0
  22. checkpoint_200000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  23. checkpoint_200000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  24. checkpoint_200000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  25. checkpoint_200000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 +3 -0
  26. checkpoint_200000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  27. checkpoint_200000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 +3 -0
  28. checkpoint_200000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  29. checkpoint_200000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  30. checkpoint_200000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  31. checkpoint_200000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 +3 -0
  32. checkpoint_200000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  33. checkpoint_200000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 +3 -0
  34. checkpoint_200000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  35. checkpoint_200000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  36. checkpoint_200000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  37. checkpoint_200000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 +3 -0
  38. checkpoint_200000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  39. checkpoint_200000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 +3 -0
  40. checkpoint_200000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  41. checkpoint_200000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  42. checkpoint_200000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  43. checkpoint_200000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 +3 -0
  44. checkpoint_200000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  45. checkpoint_200000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 +3 -0
  46. checkpoint_200000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  47. checkpoint_200000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  48. checkpoint_200000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  49. checkpoint_200000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 +3 -0
  50. checkpoint_200000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_200000/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f32d3da06e1795b76ce7de4414465ecb7c6b857bb28536e094ec54d92ac38d3d
3
+ size 8513341
checkpoint_200000/state.param_states.decoder.decoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.decoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a4c551432493eb80cb0b27a2219f38ac720e4541bdfe53be8e3b1d23a361dfd
3
+ size 3546
checkpoint_200000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b44af75fe156eef2d3883766f9f421f984f9b283b5cd75b6fe2f0beaf368f681
3
+ size 3644
checkpoint_200000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efca4b7da6cd16f06b4dacb5a9f0e9f3f923a4dda0c122ed34f3e6c8a0b9c27b
3
+ size 3408
checkpoint_200000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64e26a424e0a9dc26248a0ccbb9a816982c649c65dea292737d8d87c81e48114
3
+ size 3524
checkpoint_200000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8db81d23f824f3bd545d612852aa63e011e529c6281db96f8ccd79a45e8123dc
3
+ size 3583
checkpoint_200000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2009afff1c3c3539457a1869ead68177465c488724b897d849117f781a433f1c
3
+ size 3491
checkpoint_200000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d3d38d9b9d047973fde1c371fa4384f5682e7b6c7ca2d4fec60bbc727abae25
3
+ size 3685
checkpoint_200000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11bf41fcd9fb5a66e5da993509c9a761bd4ae44254269e1b80a5054025ab82e6
3
+ size 3647
checkpoint_200000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed4544edf070a85fc04f470ae9948a2ed64f6324072d1ee26d0dd191f9ad333d
3
+ size 3526
checkpoint_200000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05ddcac9b374489575e84276928fe9087eeecf4860be3b438f1d0700c30bf495
3
+ size 3687
checkpoint_200000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a548538b7d8ecb37df4005b01b57e3ba04ba5e132f833f43070091c5d037a87
3
+ size 3547
checkpoint_200000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72b29fd1db8d8cc656a3e6366b9e7425889532fa310fdef06bc4be7cb9ba38ec
3
+ size 3531
checkpoint_200000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ac93dfabc1ed2948951b614d0c94ed9f6c1796ab6c045eea8704df656e99eba
3
+ size 3580
checkpoint_200000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91524f495eeb1d73882c607edfdc8df40f28a5e9bd5e7d92d6d1f4cb4f26ee18
3
+ size 3588
checkpoint_200000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98ba6af38c1e82ba9008fbe0278fed14b4044cd86dd39159bcbe1c97752c9367
3
+ size 3533
checkpoint_200000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83ef655d67b8fe0e2fcf79d3821917499347967c7c36cc6262660ed3b16aabe8
3
+ size 3576
checkpoint_200000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad82f79c98b8e07a6ab1d20ba9dcd57996b41674289143c556fe00af535882b2
3
+ size 3534
checkpoint_200000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25d27f9a29d15ae6499c96834e40b0e0861d33a1109a729cc4c28b274e55041e
3
+ size 3538
checkpoint_200000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4f02b6265a7a29df987d4673a1ac2b7e2dfb3be6fa6f8755925cb55c73e2aa5
3
+ size 3654
checkpoint_200000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3655d5c8ee2ad8d458ac5cfad174a3ddf6f422bb6f478dc9d87f92784d31cf5d
3
+ size 3603
checkpoint_200000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d403040bd926d7665ee1e9f2c78ed78f20ae97c956b8d13dd72917064d905b7
3
+ size 3516
checkpoint_200000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d84452bc16e08266c7e067b2abe122c07f354e097a5b2674ae3f3454edf46ecf
3
+ size 3569
checkpoint_200000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78c11bd725cd6fdc90806a8c3db4ba4b6d1dda9e1f7985b92b032e26556bf6a6
3
+ size 3559
checkpoint_200000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_200000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c91e77d722fe6e1897fef02ceb457ce66a49327e55496efdd5befa13a568a79c
3
+ size 3522
checkpoint_200000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170