pere committed on
Commit
38c3eec
1 Parent(s): 61ffd98

Saving weights and logs of step 1000

Browse files
Files changed (4) hide show
  1. config.json +1 -1
  2. flax_model.msgpack +3 -0
  3. run_mlm_flax.py +5 -3
  4. tokenizer.json +0 -0
config.json CHANGED
@@ -19,7 +19,7 @@
19
  "num_hidden_layers": 12,
20
  "pad_token_id": 1,
21
  "position_embedding_type": "absolute",
22
- "transformers_version": "4.16.0.dev0",
23
  "type_vocab_size": 1,
24
  "use_cache": true,
25
  "vocab_size": 50265
 
19
  "num_hidden_layers": 12,
20
  "pad_token_id": 1,
21
  "position_embedding_type": "absolute",
22
+ "transformers_version": "4.15.0.dev0",
23
  "type_vocab_size": 1,
24
  "use_cache": true,
25
  "vocab_size": 50265
flax_model.msgpack ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8a3c81da267a58c6a608e02805349a57f920f73b26045f844af75f892dd9866
3
+ size 498796983
run_mlm_flax.py CHANGED
@@ -777,10 +777,12 @@ def main():
777
  # save checkpoint after each epoch and push checkpoint to the hub
778
  if jax.process_index() == 0:
779
  params = jax.device_get(jax.tree_map(lambda x: x[0], state.params))
780
- model.save_pretrained(training_args.output_dir, params=params)
 
 
 
 
781
  tokenizer.save_pretrained(training_args.output_dir)
782
- if training_args.push_to_hub:
783
- repo.push_to_hub(commit_message=f"Saving weights and logs of step {cur_step}", blocking=False)
784
 
785
  # Eval after training
786
  if training_args.do_eval:
 
777
  # save checkpoint after each epoch and push checkpoint to the hub
778
  if jax.process_index() == 0:
779
  params = jax.device_get(jax.tree_map(lambda x: x[0], state.params))
780
+ model.save_pretrained(training_args.output_dir,
781
+ params=params,
782
+ push_to_hub=training_args.push_to_hub,
783
+ commit_message=f"Saving weights and logs of step {cur_step}",
784
+ )
785
  tokenizer.save_pretrained(training_args.output_dir)
 
 
786
 
787
  # Eval after training
788
  if training_args.do_eval:
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff