sanchit-gandhi HF staff committed on
Commit
e1cca7b
1 Parent(s): 83960ec

librispeech 960h

Browse files
Files changed (1) hide show
  1. run_librispeech.sh +14 -14
run_librispeech.sh CHANGED
@@ -2,23 +2,25 @@
2
  python run_flax_speech_recognition_seq2seq.py \
3
  --dataset_name="librispeech_asr" \
4
  --model_name_or_path="./" \
5
- --dataset_config_name="clean" \
6
- --train_split_name="train.100" \
7
- --eval_split_name="validation" \
8
- --dataset_cache_dir="~/cache/huggingface/datasets" \
9
- --output_dir="./" \
10
  --preprocessing_num_workers="16" \
11
  --length_column_name="input_length" \
12
  --overwrite_output_dir \
13
- --num_train_epochs="10" \
14
- --per_device_train_batch_size="4" \
15
- --per_device_eval_batch_size="4" \
16
- --gradient_accumulation_steps="1" \
17
  --logging_steps="25" \
18
- --max_duration_in_seconds="10" \
19
- --max_target_length="64" \
 
20
  --generation_max_length="40" \
21
  --generation_num_beams="1" \
 
 
22
  --learning_rate="3e-4" \
23
  --warmup_steps="500" \
24
  --text_column_name="text" \
@@ -28,7 +30,5 @@ python run_flax_speech_recognition_seq2seq.py \
28
  --do_lower_case \
29
  --do_eval \
30
  --do_train \
31
- --push_to_hub \
32
- --use_auth_token \
33
- --wandb_project="flax-wav2vec2-2-bart-large"
34
 
 
2
  python run_flax_speech_recognition_seq2seq.py \
3
  --dataset_name="librispeech_asr" \
4
  --model_name_or_path="./" \
5
+ --dataset_config_name="all" \
6
+ --train_split_name="train.clean.100+train.clean.360+train.other.500" \
7
+ --eval_split_name="validation.clean" \
8
+ --dataset_cache_dir="/home/sanchitgandhi/cache/huggingface/datasets" \
9
+ --output_dir="./output_dir" \
10
  --preprocessing_num_workers="16" \
11
  --length_column_name="input_length" \
12
  --overwrite_output_dir \
13
+ --num_train_epochs="3" \
14
+ --per_device_train_batch_size="8" \
15
+ --per_device_eval_batch_size="2" \
 
16
  --logging_steps="25" \
17
+ --gradient_checkpointing \
18
+ --max_duration_in_seconds="20" \
19
+ --max_target_length="128" \
20
  --generation_max_length="40" \
21
  --generation_num_beams="1" \
22
+ --final_generation_max_length="200" \
23
+ --final_generation_num_beams="5" \
24
  --learning_rate="3e-4" \
25
  --warmup_steps="500" \
26
  --text_column_name="text" \
 
30
  --do_lower_case \
31
  --do_eval \
32
  --do_train \
33
+ --wandb_project="flax-wav2vec2-2-bart-large-960h"
 
 
34