Coletomyo committed on
Commit
3679e1d
1 Parent(s): 5d24bf8

optional-commit-message

Browse files
README.md CHANGED
@@ -2,7 +2,6 @@
2
  language:
3
  - mn
4
  license: apache-2.0
5
- base_model: openai/whisper-large-v2
6
  tags:
7
  - hf-asr-leaderboard
8
  - generated_from_trainer
@@ -10,12 +9,13 @@ datasets:
10
  - mozilla-foundation/common_voice_16_0
11
  metrics:
12
  - wer
 
13
  model-index:
14
  - name: Whisper Large Mongolian
15
  results:
16
  - task:
17
- name: Automatic Speech Recognition
18
  type: automatic-speech-recognition
 
19
  dataset:
20
  name: Common Voice 16.0
21
  type: mozilla-foundation/common_voice_16_0
@@ -23,9 +23,9 @@ model-index:
23
  split: None
24
  args: 'config: mn, split: test'
25
  metrics:
26
- - name: Wer
27
- type: wer
28
  value: 37.23357981731187
 
29
  ---
30
 
31
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
2
  language:
3
  - mn
4
  license: apache-2.0
 
5
  tags:
6
  - hf-asr-leaderboard
7
  - generated_from_trainer
 
9
  - mozilla-foundation/common_voice_16_0
10
  metrics:
11
  - wer
12
+ base_model: openai/whisper-large-v2
13
  model-index:
14
  - name: Whisper Large Mongolian
15
  results:
16
  - task:
 
17
  type: automatic-speech-recognition
18
+ name: Automatic Speech Recognition
19
  dataset:
20
  name: Common Voice 16.0
21
  type: mozilla-foundation/common_voice_16_0
 
23
  split: None
24
  args: 'config: mn, split: test'
25
  metrics:
26
+ - type: wer
 
27
  value: 37.23357981731187
28
+ name: Wer
29
  ---
30
 
31
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
config.json CHANGED
@@ -25,7 +25,20 @@
25
  "encoder_layerdrop": 0.0,
26
  "encoder_layers": 32,
27
  "eos_token_id": 50257,
28
- "forced_decoder_ids": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
29
  "init_std": 0.02,
30
  "is_encoder_decoder": true,
31
  "mask_feature_length": 10,
@@ -43,9 +56,98 @@
43
  "num_mel_bins": 80,
44
  "pad_token_id": 50257,
45
  "scale_embedding": false,
46
- "suppress_tokens": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
47
  "torch_dtype": "float32",
48
- "transformers_version": "4.39.0.dev0",
49
  "use_cache": true,
50
  "use_weighted_layer_sum": false,
51
  "vocab_size": 51865
 
25
  "encoder_layerdrop": 0.0,
26
  "encoder_layers": 32,
27
  "eos_token_id": 50257,
28
+ "forced_decoder_ids": [
29
+ [
30
+ 1,
31
+ 50259
32
+ ],
33
+ [
34
+ 2,
35
+ 50359
36
+ ],
37
+ [
38
+ 3,
39
+ 50363
40
+ ]
41
+ ],
42
  "init_std": 0.02,
43
  "is_encoder_decoder": true,
44
  "mask_feature_length": 10,
 
56
  "num_mel_bins": 80,
57
  "pad_token_id": 50257,
58
  "scale_embedding": false,
59
+ "suppress_tokens": [
60
+ 1,
61
+ 2,
62
+ 7,
63
+ 8,
64
+ 9,
65
+ 10,
66
+ 14,
67
+ 25,
68
+ 26,
69
+ 27,
70
+ 28,
71
+ 29,
72
+ 31,
73
+ 58,
74
+ 59,
75
+ 60,
76
+ 61,
77
+ 62,
78
+ 63,
79
+ 90,
80
+ 91,
81
+ 92,
82
+ 93,
83
+ 359,
84
+ 503,
85
+ 522,
86
+ 542,
87
+ 873,
88
+ 893,
89
+ 902,
90
+ 918,
91
+ 922,
92
+ 931,
93
+ 1350,
94
+ 1853,
95
+ 1982,
96
+ 2460,
97
+ 2627,
98
+ 3246,
99
+ 3253,
100
+ 3268,
101
+ 3536,
102
+ 3846,
103
+ 3961,
104
+ 4183,
105
+ 4667,
106
+ 6585,
107
+ 6647,
108
+ 7273,
109
+ 9061,
110
+ 9383,
111
+ 10428,
112
+ 10929,
113
+ 11938,
114
+ 12033,
115
+ 12331,
116
+ 12562,
117
+ 13793,
118
+ 14157,
119
+ 14635,
120
+ 15265,
121
+ 15618,
122
+ 16553,
123
+ 16604,
124
+ 18362,
125
+ 18956,
126
+ 20075,
127
+ 21675,
128
+ 22520,
129
+ 26130,
130
+ 26161,
131
+ 26435,
132
+ 28279,
133
+ 29464,
134
+ 31650,
135
+ 32302,
136
+ 32470,
137
+ 36865,
138
+ 42863,
139
+ 47425,
140
+ 49870,
141
+ 50254,
142
+ 50258,
143
+ 50358,
144
+ 50359,
145
+ 50360,
146
+ 50361,
147
+ 50362
148
+ ],
149
  "torch_dtype": "float32",
150
+ "transformers_version": "4.37.2",
151
  "use_cache": true,
152
  "use_weighted_layer_sum": false,
153
  "vocab_size": 51865
generation_config.json CHANGED
@@ -212,7 +212,6 @@
212
  "<|yo|>": 50325,
213
  "<|zh|>": 50260
214
  },
215
- "language": "mn",
216
  "max_initial_timestamp_index": 50,
217
  "max_length": 448,
218
  "no_timestamps_token_id": 50363,
@@ -313,5 +312,5 @@
313
  "transcribe": 50359,
314
  "translate": 50358
315
  },
316
- "transformers_version": "4.39.0.dev0"
317
  }
 
212
  "<|yo|>": 50325,
213
  "<|zh|>": 50260
214
  },
 
215
  "max_initial_timestamp_index": 50,
216
  "max_length": 448,
217
  "no_timestamps_token_id": 50363,
 
312
  "transcribe": 50359,
313
  "translate": 50358
314
  },
315
+ "transformers_version": "4.37.2"
316
  }
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e33ed6c7bde441d0c1d42a6e3f1f11e14957462266f1ee45d21b78e8640a5cdd
3
  size 4992706480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74a9fc8ea3fb1810298d1ed34154ff295867d0a54570f38573c470bfdcf231a9
3
  size 4992706480
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:857b8c0b798ec4c81074f6f20cb2915f192f6c561423b0acd60147b8313ce491
3
  size 1180663192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c6c46b5bb35b8b60b7bf75a388b3a8a5387c935e907990c5608359da0c4c69c
3
  size 1180663192