sanchit-gandhi's picture
146ecm8l: saving weights and logs of step 10k
03be9c0
#!/usr/bin/env bash
python ./run_flax_speech_recognition_seq2seq.py \
--dataset_name=mozilla-foundation/common_voice_9_0 \
--model_name_or_path=sanchit-gandhi/flax-wav2vec2-2-bart-large-scan \
--dataset_config_name=en \
--train_split_name=train \
--eval_split_name=validation \
--test_split_name=test \
--dataset_cache_dir=/home/sanchitgandhi/cache/huggingface/datasets \
--output_dir=./flax-wav2vec2-2-bart-large-cv9-feature-encoder \
--preprocessing_num_workers=1 \
--id_column_name=client_id \
--length_column_name=input_length \
--text_column_name=sentence \
--overwrite_output_dir \
--per_device_train_batch_size=8 \
--per_device_eval_batch_size=4 \
--logging_steps=25 \
--max_steps=50000 \
--eval_steps=10000 \
--save_steps=10000 \
--gradient_checkpointing \
--max_duration_in_seconds=20 \
--max_target_length=128 \
--generation_max_length=40 \
--generation_num_beams=1 \
--generation_length_penalty=1.2 \
--final_generation_max_length=200 \
--final_generation_num_beams=5 \
--learning_rate=1e-4 \
--warmup_steps=500 \
--save_total_limit=1 \
--freeze_feature_encoder=False \
--predict_with_generate \
--do_lower_case \
--do_eval \
--do_train \
--do_predict \
--push_to_hub \
--use_auth_token \
--wandb_project=commonvoice_9_0 \
--wandb_name=flax-wav2vec2-2-bart-large-cv9-feature-encoder