sanchit-gandhi HF staff committed on
Commit
03be9c0
1 Parent(s): 8f8f0d5

146ecm8l: saving weights and logs of step 10k

Browse files
Files changed (3) hide show
  1. flax_model.msgpack +3 -0
  2. nohup.out +2 -2
  3. run_cv9.sh +42 -0
flax_model.msgpack ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:671bcc5a57c4f53c53a5fd90632217839c037a7e52557c808bde40c06cdfa004
3
+ size 2353616717
nohup.out CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff7c786b45a6845a8e77375046d4927ea7c18cea820a6b9c2f86061d6716f2f2
3
- size 10931583
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3e2c8a38a9a4efed95bb3b51b7726042c407557f84caad27f76fea720cd2e12
3
+ size 8155416
run_cv9.sh ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env bash
2
+ python ./run_flax_speech_recognition_seq2seq.py \
3
+ --dataset_name=mozilla-foundation/common_voice_9_0 \
4
+ --model_name_or_path=sanchit-gandhi/flax-wav2vec2-2-bart-large-scan \
5
+ --dataset_config_name=en \
6
+ --train_split_name=train \
7
+ --eval_split_name=validation \
8
+ --test_split_name=test \
9
+ --dataset_cache_dir=/home/sanchitgandhi/cache/huggingface/datasets \
10
+ --output_dir=./flax-wav2vec2-2-bart-large-cv9-feature-encoder \
11
+ --preprocessing_num_workers=1 \
12
+ --id_column_name=client_id \
13
+ --length_column_name=input_length \
14
+ --text_column_name=sentence \
15
+ --overwrite_output_dir \
16
+ --per_device_train_batch_size=8 \
17
+ --per_device_eval_batch_size=4 \
18
+ --logging_steps=25 \
19
+ --max_steps=50000 \
20
+ --eval_steps=10000 \
21
+ --save_steps=10000 \
22
+ --gradient_checkpointing \
23
+ --max_duration_in_seconds=20 \
24
+ --max_target_length=128 \
25
+ --generation_max_length=40 \
26
+ --generation_num_beams=1 \
27
+ --generation_length_penalty=1.2 \
28
+ --final_generation_max_length=200 \
29
+ --final_generation_num_beams=5 \
30
+ --learning_rate=1e-4 \
31
+ --warmup_steps=500 \
32
+ --save_total_limit=1 \
33
+ --freeze_feature_encoder=False \
34
+ --predict_with_generate \
35
+ --do_lower_case \
36
+ --do_eval \
37
+ --do_train \
38
+ --do_predict \
39
+ --push_to_hub \
40
+ --use_auth_token \
41
+ --wandb_project=commonvoice_9_0 \
42
+ --wandb_name=flax-wav2vec2-2-bart-large-cv9-feature-encoder