w11wo committed on
Commit
daa5037
1 Parent(s): 677d035

Saving weights and logs of epoch 1

Browse files
events.out.tfevents.1625825107.t1v-n-b95d739e-w-0.172623.3.v2 → events.out.tfevents.1625848981.t1v-n-b95d739e-w-0.195447.3.v2 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e20a3b8b97c289a397b20b2c4d4300223d194b7dd9967272c6f575bc756a67d
3
  size 3581817
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:553197e40e1ee37f960da354350ed70147d500b9887c5c46dc7caa0d5d15f635
3
  size 3581817
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3903ba16f2702cb02d4cbc39d63a80d5264c9a4389fefcf48c05986133f500f3
3
  size 711588089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e4a15d3a3656c720be8f016191292ed4fd5ec92a7b80f9226fad84210702158
3
  size 711588089
nohup.out CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6d2a0bcc862bb1cff548f19aa1ce5d5314ed010bc327bda0876e0f0df804c03
3
- size 2037187
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5372b784c18a06c3f8582bd4711dc0b69cff87f87abb4355c4e10163b99f38ab
3
+ size 4112389
run.sh CHANGED
@@ -12,7 +12,7 @@ python3 run_mlm_flax.py \
12
  --preprocessing_num_workers="64" \
13
  --per_device_train_batch_size="128" \
14
  --per_device_eval_batch_size="128" \
15
- --learning_rate="2e-4" \
16
  --warmup_steps="1000" \
17
  --overwrite_output_dir \
18
  --num_train_epochs="10" \
 
12
  --preprocessing_num_workers="64" \
13
  --per_device_train_batch_size="128" \
14
  --per_device_eval_batch_size="128" \
15
+ --learning_rate="2e-5" \
16
  --warmup_steps="1000" \
17
  --overwrite_output_dir \
18
  --num_train_epochs="10" \