AlexN
/

xls-r-300m-fr

Automatic Speech Recognition

Generated from Trainer

hf-asr-leaderboard

mozilla-foundation/common_voice_8_0

robust-speech-event

Inference Endpoints

Model card | Files and versions | Community

AlexN committed on Jan 28, 2022

Commit

37f8bf6

•

1 Parent(s): 6da6a4b

initial commit

Files changed (1) hide show

run.sh +40 -0

run.sh ADDED Viewed

	@@ -0,0 +1,40 @@

+WANDB_PROJECT=auto-speech-recognition-french
+python run_speech_recognition_ctc.py \
+--dataset_name="mozilla-foundation/common_voice_8_0" \
+--model_name_or_path="facebook/wav2vec2-xls-r-300m" \
+--dataset_config_name="fr" \
+--output_dir="./" \
+--overwrite_output_dir \
+--num_train_epochs="5" \
+--per_device_train_batch_size="32" \
+--per_device_eval_batch_size="32" \
+--gradient_accumulation_steps="1" \
+--learning_rate="7e-5" \
+--warmup_steps="1500" \
+--length_column_name="input_length" \
+--evaluation_strategy="steps" \
+--text_column_name="sentence" \
+--save_steps="500" \
+--eval_steps="500" \
+--logging_steps="100" \
+--layerdrop="0.0" \
+--activation_dropout="0.1" \
+--save_total_limit="3" \
+--freeze_feature_encoder \
+--feat_proj_dropout="0.0" \
+--mask_time_prob="0.15" \
+--mask_time_length="10" \
+--mask_feature_prob="0.3" \
+--mask_feature_length="10" \
+--gradient_checkpointing \
+--report_to="wandb" \
+--run_name="xls-r-300m-fr" \
+--max_eval_samples="4000" \
+--max_duration_in_seconds="5" \
+--use_auth_token \
+--fp16 \
+--group_by_length \
+--preprocessing_num_workers="64" \
+--do_train --do_eval \
+--load_best_model_at_end \
+--push_to_hub