aapot commited on
Commit
1aa8b47
1 Parent(s): 81663ba

Add 500k train step and HF flax model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. checkpoint_500000/checkpoint +3 -0
  2. checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
  3. checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
  4. checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  5. checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  6. checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  7. checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
  8. checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  9. checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
  10. checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  11. checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  12. checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  13. checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
  14. checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  15. checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
  16. checkpoint_500000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  17. checkpoint_500000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  18. checkpoint_500000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  19. checkpoint_500000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 +3 -0
  20. checkpoint_500000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  21. checkpoint_500000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 +3 -0
  22. checkpoint_500000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  23. checkpoint_500000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  24. checkpoint_500000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  25. checkpoint_500000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 +3 -0
  26. checkpoint_500000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  27. checkpoint_500000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 +3 -0
  28. checkpoint_500000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  29. checkpoint_500000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  30. checkpoint_500000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  31. checkpoint_500000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 +3 -0
  32. checkpoint_500000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  33. checkpoint_500000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 +3 -0
  34. checkpoint_500000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  35. checkpoint_500000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  36. checkpoint_500000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  37. checkpoint_500000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 +3 -0
  38. checkpoint_500000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  39. checkpoint_500000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 +3 -0
  40. checkpoint_500000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  41. checkpoint_500000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  42. checkpoint_500000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  43. checkpoint_500000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 +3 -0
  44. checkpoint_500000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
  45. checkpoint_500000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 +3 -0
  46. checkpoint_500000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
  47. checkpoint_500000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 +3 -0
  48. checkpoint_500000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray +3 -0
  49. checkpoint_500000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 +3 -0
  50. checkpoint_500000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_500000/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:030260556a01c81cdd4d9010b421211e92351e1041ae8a87d35284baccd28b8d
3
+ size 8513341
checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.decoder_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75e2af8c29cbb48b7145d1abde22e14baed61b9f3f68c82482934cd4d63820a9
3
+ size 3553
checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a15c8185b7e93f014ad9a4036a082d2c39d5e3764b3bb463afd13c74115cf685
3
+ size 3764
checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b86d0e11dcaaf0564b45321e4dde7ebed77e9d633b995f4e989335cee089e0de
3
+ size 3776
checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3e219cef34a87b6586f888dd4d2eabb4a48fd6b39810cebdc9c00165b4a99f5
3
+ size 3675
checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2efdf391e98eb31b10aae77b9711a4a35a63c9946cbad5bcb272bcacddea6d1
3
+ size 3741
checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4e78f30bfa85a1cd4dc85301dbf7da9d359d01b14b14c84abd416f57e61509b
3
+ size 3739
checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4df02b7118054d49227e22e549b9952244ff04a96088bb69d606b9d4bf64957
3
+ size 3769
checkpoint_500000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f5db81f827b659386ab96a3ba82715f251e420234dd54ce7a8e17d34537a5c1
3
+ size 3849
checkpoint_500000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f73ad2aa5bcff78644a081c2201ca40af22d5b483ae2b924eb86bbc7dbea3152
3
+ size 3773
checkpoint_500000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91f8f8be478c40479b5bbae53010e2d37a4d31650277bce8d691fd83afc22f6d
3
+ size 3799
checkpoint_500000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efcd90e9d052bf1ff5597c4134c712ab9c5addeb73c535739ed25fe21345c65e
3
+ size 3829
checkpoint_500000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d21523b72080c7b85398a6739eb81e7a03a1d60a2f3b54357dd07dd0400837d5
3
+ size 3798
checkpoint_500000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cb718043fd544341c47c6ad57e7653d7490721fad68b7bf9d2893650c56616e
3
+ size 3777
checkpoint_500000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d1b964f11e642a03f54e9add53dccff5f96162c14e846cad5ed9cab5616ca29
3
+ size 3813
checkpoint_500000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9787dc5f4a52310c0f1827969d9ab989631bee2ad8cdc2b66727dbd5823004
3
+ size 3770
checkpoint_500000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26a05686b5647312ed9a7087dea8bc4246f8e7924d53db04c17ce64ea0417af7
3
+ size 3768
checkpoint_500000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fde7b4d989a6d9de675c964269bf6e40daab3e4e6d06dd9d080e8ace979d1dfc
3
+ size 3836
checkpoint_500000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91706f229289d93fba8ebc14be0b16295c5a71df71c1490396ff9a3a59f87837
3
+ size 3765
checkpoint_500000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55a2d0eabdfd3eca152c1297065a1f4c2a13acd9a4b257cf566e061823dc0639
3
+ size 3757
checkpoint_500000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a56b72523ab4d24e13af7b148d14ba80c0db1f1382f255eba35df19d2a5b2ce
3
+ size 3786
checkpoint_500000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14672e963ed6cdd5b81521eedd46b34fd73b5223ba22dc61f8147114a6b5f0c6
3
+ size 3717
checkpoint_500000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:504f79e63815d29fc013bcd1147a8f1c80cd03527f3cc883f2114b0a0d0b5e43
3
+ size 3759
checkpoint_500000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0b9eb5a8488cb168ddc9176e54329a61662245c235e9dc44b4a18d58e2d155b
3
+ size 3791
checkpoint_500000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170
checkpoint_500000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:432e6a821d13e7a93ec0444dbacd8076b0b01c01d33f033171cf345f8a583b50
3
+ size 3736
checkpoint_500000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:775db7db7452b8ae662659f5556db09104afc5fefff029c0df59f241b9fb0b07
3
+ size 170