evertonaleixo committed on
Commit
5ffd4ce
1 Parent(s): 48929b9

Training in progress, step 500

Browse files
Files changed (4) hide show
  1. README.md +9 -33
  2. config.json +9 -11
  3. pytorch_model.bin +2 -2
  4. training_args.bin +1 -1
README.md CHANGED
@@ -1,40 +1,23 @@
1
  ---
 
 
2
  license: apache-2.0
3
- base_model: openai/whisper-tiny
4
  tags:
5
  - generated_from_trainer
6
  datasets:
7
- - PolyAI/minds14
8
- metrics:
9
- - wer
10
  model-index:
11
- - name: whisper-small-dv
12
- results:
13
- - task:
14
- name: Automatic Speech Recognition
15
- type: automatic-speech-recognition
16
- dataset:
17
- name: PolyAI/minds14
18
- type: PolyAI/minds14
19
- config: en-US
20
- split: train
21
- args: en-US
22
- metrics:
23
- - name: Wer
24
- type: wer
25
- value: 0.0
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
29
  should probably proofread and complete it, then remove this comment. -->
30
 
31
- # whisper-small-dv
32
 
33
- This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the PolyAI/minds14 dataset.
34
- It achieves the following results on the evaluation set:
35
- - Loss: 0.0000
36
- - Wer Ortho: 0.0
37
- - Wer: 0.0
38
 
39
  ## Model description
40
 
@@ -60,14 +43,7 @@ The following hyperparameters were used during training:
60
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
61
  - lr_scheduler_type: constant_with_warmup
62
  - lr_scheduler_warmup_steps: 50
63
- - training_steps: 50
64
-
65
- ### Training results
66
-
67
- | Training Loss | Epoch | Step | Validation Loss | Wer Ortho | Wer |
68
- |:-------------:|:-----:|:----:|:---------------:|:---------:|:---:|
69
- | 0.0 | 1.79 | 50 | 0.0000 | 0.0 | 0.0 |
70
-
71
 
72
  ### Framework versions
73
 
 
1
  ---
2
+ language:
3
+ - dv
4
  license: apache-2.0
5
+ base_model: openai/whisper-small
6
  tags:
7
  - generated_from_trainer
8
  datasets:
9
+ - mozilla-foundation/common_voice_13_0
 
 
10
  model-index:
11
+ - name: Whisper Small Dv
12
+ results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  ---
14
 
15
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
16
  should probably proofread and complete it, then remove this comment. -->
17
 
18
+ # Whisper Small Dv
19
 
20
+ This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 13 dataset.
 
 
 
 
21
 
22
  ## Model description
23
 
 
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: constant_with_warmup
45
  - lr_scheduler_warmup_steps: 50
46
+ - training_steps: 500
 
 
 
 
 
 
 
47
 
48
  ### Framework versions
49
 
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "CordwainerSmith/whisper-tiny-PolyAI-minds14",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
@@ -13,17 +13,17 @@
13
  ],
14
  "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
16
- "d_model": 384,
17
- "decoder_attention_heads": 6,
18
- "decoder_ffn_dim": 1536,
19
  "decoder_layerdrop": 0.0,
20
- "decoder_layers": 4,
21
  "decoder_start_token_id": 50258,
22
  "dropout": 0.0,
23
- "encoder_attention_heads": 6,
24
- "encoder_ffn_dim": 1536,
25
  "encoder_layerdrop": 0.0,
26
- "encoder_layers": 4,
27
  "eos_token_id": 50257,
28
  "forced_decoder_ids": [
29
  [
@@ -52,7 +52,7 @@
52
  "max_target_positions": 448,
53
  "median_filter_width": 7,
54
  "model_type": "whisper",
55
- "num_hidden_layers": 4,
56
  "num_mel_bins": 80,
57
  "pad_token_id": 50257,
58
  "scale_embedding": false,
@@ -140,8 +140,6 @@
140
  49870,
141
  50254,
142
  50258,
143
- 50358,
144
- 50359,
145
  50360,
146
  50361,
147
  50362
 
1
  {
2
+ "_name_or_path": "sanchit-gandhi/whisper-small-dv",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
13
  ],
14
  "bos_token_id": 50257,
15
  "classifier_proj_size": 256,
16
+ "d_model": 768,
17
+ "decoder_attention_heads": 12,
18
+ "decoder_ffn_dim": 3072,
19
  "decoder_layerdrop": 0.0,
20
+ "decoder_layers": 12,
21
  "decoder_start_token_id": 50258,
22
  "dropout": 0.0,
23
+ "encoder_attention_heads": 12,
24
+ "encoder_ffn_dim": 3072,
25
  "encoder_layerdrop": 0.0,
26
+ "encoder_layers": 12,
27
  "eos_token_id": 50257,
28
  "forced_decoder_ids": [
29
  [
 
52
  "max_target_positions": 448,
53
  "median_filter_width": 7,
54
  "model_type": "whisper",
55
+ "num_hidden_layers": 12,
56
  "num_mel_bins": 80,
57
  "pad_token_id": 50257,
58
  "scale_embedding": false,
 
140
  49870,
141
  50254,
142
  50258,
 
 
143
  50360,
144
  50361,
145
  50362
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8bd1112ab6515cbdea9590ae1dcfeaa4840dbb67e622df77bf382238a5b88ae
3
- size 151099049
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f99c86b534ca911d9e4bbeafca9617d07cba0de1f06dafd069db00c5ae222fc
3
+ size 967102729
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21b047d135c1ffae4b14b50622c87ebab8ce4e795df4b97fc0328c7e0f38ff37
3
  size 4219
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71cf6cca35c37866adfa57f660b0cda218a99db43945d1e9c1caaac5b4cf87be
3
  size 4219