File size: 576 Bytes
e565538
 
 
 
 
 
 
 
 
 
 
 
 
 
 
ebb3343
 
e565538
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
python3 run_dnlm_flax.py \
  --output_dir rotobart_output \
  --overwrite_output_dir \
  --dataset_path wikitext \
  --model_name_or_path rotobart \
  --tokenizer_name vocab-2/the_pile.model \
  --shuffle_buffer_size 100_000 \
  --do_train --do_eval \
  --max_seq_length 1024 \
  --encoder_layers 12 \
  --decoder_layers 12 \
  --per_device_train_batch_size 1 \
  --per_device_eval_batch_size 1 \
  --logging_steps 8 \
  --num_train_steps 1000 \
  --eval_steps 100 \
  --save_steps 100 \
  --num_eval_samples 25 \
  --warmup_steps 30 \
  --learning_rate 1e-4 \
  --use_bf16 \