boris commited on
Commit
5ca30e6
1 Parent(s): 69cf636

feat: update scripts

Browse files
dev/seq2seq/do_big_run.sh CHANGED
@@ -2,15 +2,16 @@ python run_seq2seq_flax.py \
2
  --dataset_repo_or_path dalle-mini/encoded \
3
  --train_file **/train/*/*.jsonl \
4
  --validation_file **/valid/*/*.jsonl \
5
- --len_train 42684248 \
6
- --len_eval 34328 \
 
7
  --streaming \
8
  --normalize_text \
9
  --output_dir output \
10
  --per_device_train_batch_size 56 \
11
  --per_device_eval_batch_size 56 \
12
  --preprocessing_num_workers 80 \
13
- --warmup_steps 500 \
14
  --gradient_accumulation_steps 8 \
15
  --do_train \
16
  --do_eval \
 
2
  --dataset_repo_or_path dalle-mini/encoded \
3
  --train_file **/train/*/*.jsonl \
4
  --validation_file **/valid/*/*.jsonl \
5
+ --len_train 129847128 \
6
+ --len_eval 157312 \
7
+ --eval_steps 1000 \
8
  --streaming \
9
  --normalize_text \
10
  --output_dir output \
11
  --per_device_train_batch_size 56 \
12
  --per_device_eval_batch_size 56 \
13
  --preprocessing_num_workers 80 \
14
+ --warmup_steps 5000 \
15
  --gradient_accumulation_steps 8 \
16
  --do_train \
17
  --do_eval \
dev/seq2seq/do_small_run.sh CHANGED
@@ -1,13 +1,13 @@
1
  python run_seq2seq_flax.py \
2
  --dataset_repo_or_path dalle-mini/encoded \
3
- --train_file **/train/*/*.jsonl \
4
  --validation_file **/valid/*/*.jsonl \
5
- --len_train 42684248 \
6
- --len_eval 34328 \
7
  --streaming \
8
  --output_dir output \
9
- --per_device_train_batch_size 56 \
10
- --per_device_eval_batch_size 56 \
11
  --preprocessing_num_workers 80 \
12
  --warmup_steps 125 \
13
  --gradient_accumulation_steps 8 \
 
1
  python run_seq2seq_flax.py \
2
  --dataset_repo_or_path dalle-mini/encoded \
3
+ --train_file **/train/CC3M/*.jsonl \
4
  --validation_file **/valid/*/*.jsonl \
5
+ --len_train 129847128 \
6
+ --len_eval 157312 \
7
  --streaming \
8
  --output_dir output \
9
+ --per_device_train_batch_size 16 \
10
+ --per_device_eval_batch_size 16 \
11
  --preprocessing_num_workers 80 \
12
  --warmup_steps 125 \
13
  --gradient_accumulation_steps 8 \