sanchit-gandhi HF staff committed on
Commit
71b88b9
1 Parent(s): 41365be

Add model weights

Browse files
Files changed (3) hide show
  1. .gitattributes +1 -0
  2. medium.en.whisper +3 -0
  3. run_librispeech.sh +38 -0
.gitattributes CHANGED
@@ -30,3 +30,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
30
  *.zip filter=lfs diff=lfs merge=lfs -text
31
  *.zst filter=lfs diff=lfs merge=lfs -text
32
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
30
  *.zip filter=lfs diff=lfs merge=lfs -text
31
  *.zst filter=lfs diff=lfs merge=lfs -text
32
  *tfevents* filter=lfs diff=lfs merge=lfs -text
33
+ *.whisper filter=lfs diff=lfs merge=lfs -text
medium.en.whisper ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e82e4a62220c0dc0aae204900c6061708339307e82694ad61ccd7fcb922193a8
3
+ size 3055771163
run_librispeech.sh ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env bash
2
+ CUDA_VISIBLE_DEVICES=0 python run_speech_recognition_whisper.py \
3
+ --model_name_or_path="medium.en" \
4
+ --dataset_name="librispeech_asr" \
5
+ --dataset_config_name="all" \
6
+ --train_split_name="train.clean.100+train.clean.360+train.other.500" \
7
+ --eval_split_name="validation.clean" \
8
+ --test_split_name="validation.other+test.clean+test.other" \
9
+ --max_steps="5000" \
10
+ --text_column_name="text" \
11
+ --output_dir="./" \
12
+ --run_name="whisper-ls-960h-5k" \
13
+ --wandb_project="whisper" \
14
+ --per_device_train_batch_size="64" \
15
+ --per_device_eval_batch_size="16" \
16
+ --logging_steps="25" \
17
+ --learning_rate="1e-4" \
18
+ --warmup_steps="500" \
19
+ --report_to="wandb" \
20
+ --preprocessing_num_workers="16" \
21
+ --evaluation_strategy="steps" \
22
+ --eval_steps="1000" \
23
+ --save_strategy="steps" \
24
+ --save_steps="1000" \
25
+ --generation_max_length="224" \
26
+ --length_column_name="input_lengths" \
27
+ --do_lower_case="True" \
28
+ --push_to_hub="False" \
29
+ --gradient_checkpointing \
30
+ --group_by_length \
31
+ --freeze_encoder \
32
+ --fp16 \
33
+ --overwrite_output_dir \
34
+ --do_train \
35
+ --do_eval \
36
+ --do_predict \
37
+ --predict_with_generate \
38
+ --use_auth_token