DrishtiSharma committed on
Commit
3013e9b
•
1 Parent(s): d843f6a

Training in progress, step 500

Browse files
.ipynb_checkpoints/run-checkpoint.sh CHANGED
@@ -4,11 +4,11 @@ python run_speech_recognition_ctc.py \
4
  --dataset_config_name="pa-IN" \
5
  --output_dir="./" \
6
  --overwrite_output_dir \
7
- --num_train_epochs="200" \
8
  --per_device_train_batch_size="16" \
9
  --per_device_eval_batch_size="8" \
10
  --learning_rate="3e-4" \
11
- --warmup_steps="1500" \
12
  --length_column_name="input_length" \
13
  --evaluation_strategy="steps" \
14
  --text_column_name="sentence" \
@@ -20,9 +20,9 @@ python run_speech_recognition_ctc.py \
20
  --save_total_limit="1" \
21
  --freeze_feature_encoder \
22
  --feat_proj_dropout="0.0" \
23
- --mask_time_prob="0.75" \
24
  --mask_time_length="10" \
25
- --mask_feature_prob="0.25" \
26
  --mask_feature_length="64" \
27
  --chars_to_ignore , ? . ! \- \; \: \" β€œ % β€˜ ” οΏ½ β€” ’ … – Β« Β» β€ž \` _ \
28
  --gradient_checkpointing \
 
4
  --dataset_config_name="pa-IN" \
5
  --output_dir="./" \
6
  --overwrite_output_dir \
7
+ --num_train_epochs="100" \
8
  --per_device_train_batch_size="16" \
9
  --per_device_eval_batch_size="8" \
10
  --learning_rate="3e-4" \
11
+ --warmup_steps="1200" \
12
  --length_column_name="input_length" \
13
  --evaluation_strategy="steps" \
14
  --text_column_name="sentence" \
 
20
  --save_total_limit="1" \
21
  --freeze_feature_encoder \
22
  --feat_proj_dropout="0.0" \
23
+ --mask_time_prob="0.05" \
24
  --mask_time_length="10" \
25
+ --mask_feature_prob="0.05" \
26
  --mask_feature_length="64" \
27
  --chars_to_ignore , ? . ! \- \; \: \" β€œ % β€˜ ” οΏ½ β€” ’ … – Β« Β» β€ž \` _ \
28
  --gradient_checkpointing \
config.json CHANGED
@@ -61,10 +61,10 @@
61
  "layerdrop": 0.0,
62
  "mask_feature_length": 64,
63
  "mask_feature_min_masks": 0,
64
- "mask_feature_prob": 0.25,
65
  "mask_time_length": 10,
66
  "mask_time_min_masks": 2,
67
- "mask_time_prob": 0.75,
68
  "model_type": "wav2vec2",
69
  "num_adapter_layers": 3,
70
  "num_attention_heads": 16,
 
61
  "layerdrop": 0.0,
62
  "mask_feature_length": 64,
63
  "mask_feature_min_masks": 0,
64
+ "mask_feature_prob": 0.05,
65
  "mask_time_length": 10,
66
  "mask_time_min_masks": 2,
67
+ "mask_time_prob": 0.05,
68
  "model_type": "wav2vec2",
69
  "num_adapter_layers": 3,
70
  "num_attention_heads": 16,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c4b7517f11637e6acabdd9728be577c8a021ad5019ebc00b7863a59167e474b
3
  size 1262194289
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3047206709c8430e48b6d738fa94dc80544d7a168c36e603faa2e4e22f5106b
3
  size 1262194289
run.sh CHANGED
@@ -4,11 +4,11 @@ python run_speech_recognition_ctc.py \
4
  --dataset_config_name="pa-IN" \
5
  --output_dir="./" \
6
  --overwrite_output_dir \
7
- --num_train_epochs="200" \
8
  --per_device_train_batch_size="16" \
9
  --per_device_eval_batch_size="8" \
10
  --learning_rate="3e-4" \
11
- --warmup_steps="1500" \
12
  --length_column_name="input_length" \
13
  --evaluation_strategy="steps" \
14
  --text_column_name="sentence" \
@@ -20,9 +20,9 @@ python run_speech_recognition_ctc.py \
20
  --save_total_limit="1" \
21
  --freeze_feature_encoder \
22
  --feat_proj_dropout="0.0" \
23
- --mask_time_prob="0.75" \
24
  --mask_time_length="10" \
25
- --mask_feature_prob="0.25" \
26
  --mask_feature_length="64" \
27
  --chars_to_ignore , ? . ! \- \; \: \" β€œ % β€˜ ” οΏ½ β€” ’ … – Β« Β» β€ž \` _ \
28
  --gradient_checkpointing \
 
4
  --dataset_config_name="pa-IN" \
5
  --output_dir="./" \
6
  --overwrite_output_dir \
7
+ --num_train_epochs="100" \
8
  --per_device_train_batch_size="16" \
9
  --per_device_eval_batch_size="8" \
10
  --learning_rate="3e-4" \
11
+ --warmup_steps="1200" \
12
  --length_column_name="input_length" \
13
  --evaluation_strategy="steps" \
14
  --text_column_name="sentence" \
 
20
  --save_total_limit="1" \
21
  --freeze_feature_encoder \
22
  --feat_proj_dropout="0.0" \
23
+ --mask_time_prob="0.05" \
24
  --mask_time_length="10" \
25
+ --mask_feature_prob="0.05" \
26
  --mask_feature_length="64" \
27
  --chars_to_ignore , ? . ! \- \; \: \" β€œ % β€˜ ” οΏ½ β€” ’ … – Β« Β» β€ž \` _ \
28
  --gradient_checkpointing \
special_tokens_map.json CHANGED
@@ -1 +1 @@
1
- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ce5521e7d5bfb2e376e94f2b63e11df51adac0d076e157e0d59b86829b64f4e
3
  size 2991
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b1aedc4fe7ec92200eafc3ebd49f8423ed1f76a39299859626edb51c651c948
3
  size 2991