Patrick von Platen committed on
Commit
4ced1f4
1 Parent(s): d4943b3

Saving weights and logs of step 10000

Browse files
config.json CHANGED
@@ -23,7 +23,7 @@
23
  "pad_token_id": 0,
24
  "relative_attention_num_buckets": 32,
25
  "tie_word_embeddings": false,
26
- "transformers_version": "4.9.0.dev0",
27
  "use_cache": true,
28
  "vocab_size": 32103
29
  }
23
  "pad_token_id": 0,
24
  "relative_attention_num_buckets": 32,
25
  "tie_word_embeddings": false,
26
+ "transformers_version": "4.10.0.dev0",
27
  "use_cache": true,
28
  "vocab_size": 32103
29
  }
events.out.tfevents.1628202584.t1v-n-71556209-w-0.30846.3.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:686e0d225f325d8f29fec786835c148b9883930d24c1c6b38a53318def837ab8
3
+ size 1467751
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1eda5211cd924f4a97259363bac36b102ae2c29ff1525a4c7758cc198fb57c73
3
  size 990170015
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5cc6f959553e9a675e397fcb4e7327932b60711361863457bbaead22534782f
3
  size 990170015
run_t5.sh CHANGED
@@ -14,7 +14,7 @@
14
  --weight_decay="0.001" \
15
  --warmup_steps="2000" \
16
  --overwrite_output_dir \
17
- --logging_steps="100" \
18
- --save_steps="1000" \
19
- --eval_steps="1000" \
20
  --push_to_hub
14
  --weight_decay="0.001" \
15
  --warmup_steps="2000" \
16
  --overwrite_output_dir \
17
+ --logging_steps="500" \
18
+ --save_steps="10000" \
19
+ --eval_steps="2500" \
20
  --push_to_hub