sakares committed on
Commit
2071335
1 Parent(s): 8887f4f

Increase batch size (bs) to 128 and change dtype to fp32

Browse files
Files changed (1) hide show
  1. run.sh +2 -3
run.sh CHANGED
@@ -9,8 +9,8 @@ python3 run_mlm_flax.py \
9
  --max_seq_length="128" \
10
  --weight_decay="0.01" \
11
  --preprocessing_num_workers="64" \
12
- --per_device_train_batch_size="32" \
13
- --per_device_eval_batch_size="32" \
14
  --learning_rate="3e-5" \
15
  --warmup_steps="5000" \
16
  --overwrite_output_dir \
@@ -21,5 +21,4 @@ python3 run_mlm_flax.py \
21
  --logging_steps="500" \
22
  --save_steps="5000" \
23
  --eval_steps="20000" \
24
- --dtype="bfloat16" \
25
  --push_to_hub
 
9
  --max_seq_length="128" \
10
  --weight_decay="0.01" \
11
  --preprocessing_num_workers="64" \
12
+ --per_device_train_batch_size="128" \
13
+ --per_device_eval_batch_size="128" \
14
  --learning_rate="3e-5" \
15
  --warmup_steps="5000" \
16
  --overwrite_output_dir \
 
21
  --logging_steps="500" \
22
  --save_steps="5000" \
23
  --eval_steps="20000" \
 
24
  --push_to_hub