File size: 470 Bytes
32dc2d8
 
 
 
 
650ecb1
 
 
b66b951
650ecb1
32dc2d8
 
650ecb1
 
 
bc01f78
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
# Launch run_seq2seq_flax.py with a fixed set of command-line flags.
#
# The argument list is accumulated one option per statement instead of one
# long backslash-continued command, so a single setting can be edited or
# commented out without breaking the continuation chain.
#
# NOTE(review): the meaning of each flag is defined by run_seq2seq_flax.py,
# which is not visible here; the group headings below are inferred from the
# flag names only and should be confirmed against that script.
launch_training() {
	# Discard whatever arguments the function received; positional parameters
	# are function-local, so the caller's "$@" is left untouched.
	set --

	# Inputs and output location (paths are hard-coded).
	set -- "$@" --max_source_length 128
	set -- "$@" --train_file /data/CC12M/encoded-small-train.tsv
	set -- "$@" --validation_file /data/CC12M/encoded-small-valid.tsv
	set -- "$@" --output_dir output

	# Batch sizes and preprocessing worker count.
	set -- "$@" --per_device_train_batch_size 56
	set -- "$@" --per_device_eval_batch_size 56
	set -- "$@" --preprocessing_num_workers 80

	# Step-related settings.
	set -- "$@" --warmup_steps 1000
	set -- "$@" --gradient_accumulation_steps 8

	# Value-less switches.
	set -- "$@" --do_train
	set -- "$@" --do_eval
	set -- "$@" --adafactor

	# Run length and learning rate.
	set -- "$@" --num_train_epochs 1
	set -- "$@" --max_train_samples 200000
	set -- "$@" --learning_rate 0.003

	# The function's status (and therefore the script's, as this is the last
	# command executed) is the exit status of the python process.
	python run_seq2seq_flax.py "$@"
}

launch_training