hanasim committed on
Commit
21fd474
·
verified ·
1 Parent(s): 0fff16a

End of training

Browse files
README.md CHANGED
@@ -1,21 +1,24 @@
1
  ---
 
 
2
  license: apache-2.0
3
  base_model: openai/whisper-small
4
  tags:
 
5
  - generated_from_trainer
6
  datasets:
7
- - common_voice_16_0
8
  metrics:
9
  - wer
10
  model-index:
11
- - name: breeze-listen-dsw-small-ml
12
  results:
13
  - task:
14
  name: Automatic Speech Recognition
15
  type: automatic-speech-recognition
16
  dataset:
17
- name: common_voice_16_0
18
- type: common_voice_16_0
19
  config: ml
20
  split: test
21
  args: ml
@@ -28,9 +31,9 @@ model-index:
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
29
  should probably proofread and complete it, then remove this comment. -->
30
 
31
- # breeze-listen-dsw-small-ml
32
 
33
- This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the common_voice_16_0 dataset.
34
  It achieves the following results on the evaluation set:
35
  - Loss: 0.3826
36
  - Wer: 33.9203
 
1
  ---
2
+ language:
3
+ - ml
4
  license: apache-2.0
5
  base_model: openai/whisper-small
6
  tags:
7
+ - whisper-event
8
  - generated_from_trainer
9
  datasets:
10
+ - mozilla-foundation/common_voice_16_0
11
  metrics:
12
  - wer
13
  model-index:
14
+ - name: Breeze DSW Malayalam - small
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
18
  type: automatic-speech-recognition
19
  dataset:
20
+ name: mozilla-foundation/common_voice_16_0 ml
21
+ type: mozilla-foundation/common_voice_16_0
22
  config: ml
23
  split: test
24
  args: ml
 
31
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
32
  should probably proofread and complete it, then remove this comment. -->
33
 
34
+ # Breeze DSW Malayalam - small
35
 
36
+ This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the mozilla-foundation/common_voice_16_0 ml dataset.
37
  It achieves the following results on the evaluation set:
38
  - Loss: 0.3826
39
  - Wer: 33.9203
all_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.07,
3
+ "eval_loss": 0.382568359375,
4
+ "eval_runtime": 4040.4498,
5
+ "eval_samples_per_second": 0.164,
6
+ "eval_steps_per_second": 0.021,
7
+ "eval_wer": 33.92029657089898,
8
+ "train_loss": 0.0,
9
+ "train_runtime": 18.9864,
10
+ "train_samples_per_second": 842.709,
11
+ "train_steps_per_second": 52.669
12
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.07,
3
+ "eval_loss": 0.382568359375,
4
+ "eval_runtime": 4040.4498,
5
+ "eval_samples_per_second": 0.164,
6
+ "eval_steps_per_second": 0.021,
7
+ "eval_wer": 33.92029657089898
8
+ }
runs/Jan18_17-40-33_knight/events.out.tfevents.1705596099.knight.168415.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65c13cbc52b10d33456e8113e6986b08ff8ddd150abf08fc445e22b18c59bd66
3
- size 8321
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0be63fdd81af8defaa68a70ef70efc912633f33112c5f19fbdd3f98d6e9b3cbd
3
+ size 12733
runs/Jan19_15-12-42_knight/events.out.tfevents.1705677727.knight.2681.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edae9303b29a528983793247abb0918fbcf4b0cb6ea4943e97f8c7950c1f227c
3
+ size 406
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.07,
3
+ "train_loss": 0.0,
4
+ "train_runtime": 18.9864,
5
+ "train_samples_per_second": 842.709,
6
+ "train_steps_per_second": 52.669
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,261 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 33.92029657089898,
3
+ "best_model_checkpoint": "/cosmos/home/sp-operator/ai/training/models/huggingface/scripts/../breeze-listen-dsw-small-ml/checkpoint-700",
4
+ "epoch": 8.068,
5
+ "eval_steps": 100,
6
+ "global_step": 700,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.03,
13
+ "learning_rate": 4.898977360288234e-06,
14
+ "loss": 1.5105,
15
+ "step": 25
16
+ },
17
+ {
18
+ "epoch": 0.05,
19
+ "learning_rate": 6.160712527409633e-06,
20
+ "loss": 1.0831,
21
+ "step": 50
22
+ },
23
+ {
24
+ "epoch": 0.07,
25
+ "learning_rate": 6.85912902234906e-06,
26
+ "loss": 0.7569,
27
+ "step": 75
28
+ },
29
+ {
30
+ "epoch": 1.02,
31
+ "learning_rate": 7.344547104469332e-06,
32
+ "loss": 0.4577,
33
+ "step": 100
34
+ },
35
+ {
36
+ "epoch": 1.02,
37
+ "eval_loss": 0.482421875,
38
+ "eval_runtime": 4089.3252,
39
+ "eval_samples_per_second": 0.162,
40
+ "eval_steps_per_second": 0.02,
41
+ "eval_wer": 58.38739573679332,
42
+ "step": 100
43
+ },
44
+ {
45
+ "epoch": 1.05,
46
+ "learning_rate": 7.716963756434345e-06,
47
+ "loss": 0.364,
48
+ "step": 125
49
+ },
50
+ {
51
+ "epoch": 1.07,
52
+ "learning_rate": 8.019180844200955e-06,
53
+ "loss": 0.2875,
54
+ "step": 150
55
+ },
56
+ {
57
+ "epoch": 2.02,
58
+ "learning_rate": 8.27351214279797e-06,
59
+ "loss": 0.2145,
60
+ "step": 175
61
+ },
62
+ {
63
+ "epoch": 2.04,
64
+ "learning_rate": 8.49307723936858e-06,
65
+ "loss": 0.1781,
66
+ "step": 200
67
+ },
68
+ {
69
+ "epoch": 2.04,
70
+ "eval_loss": 0.306640625,
71
+ "eval_runtime": 4087.5604,
72
+ "eval_samples_per_second": 0.162,
73
+ "eval_steps_per_second": 0.02,
74
+ "eval_wer": 41.06580166821131,
75
+ "step": 200
76
+ },
77
+ {
78
+ "epoch": 2.07,
79
+ "learning_rate": 8.686247975778677e-06,
80
+ "loss": 0.1593,
81
+ "step": 225
82
+ },
83
+ {
84
+ "epoch": 3.01,
85
+ "learning_rate": 8.858694625217149e-06,
86
+ "loss": 0.1224,
87
+ "step": 250
88
+ },
89
+ {
90
+ "epoch": 3.04,
91
+ "learning_rate": 9.014436199608479e-06,
92
+ "loss": 0.1031,
93
+ "step": 275
94
+ },
95
+ {
96
+ "epoch": 3.06,
97
+ "learning_rate": 9.156425255148058e-06,
98
+ "loss": 0.0935,
99
+ "step": 300
100
+ },
101
+ {
102
+ "epoch": 3.06,
103
+ "eval_loss": 0.290283203125,
104
+ "eval_runtime": 4061.9776,
105
+ "eval_samples_per_second": 0.163,
106
+ "eval_steps_per_second": 0.02,
107
+ "eval_wer": 35.644114921223355,
108
+ "step": 300
109
+ },
110
+ {
111
+ "epoch": 4.01,
112
+ "learning_rate": 9.28689473531776e-06,
113
+ "loss": 0.0784,
114
+ "step": 325
115
+ },
116
+ {
117
+ "epoch": 4.03,
118
+ "learning_rate": 9.407574351377137e-06,
119
+ "loss": 0.0624,
120
+ "step": 350
121
+ },
122
+ {
123
+ "epoch": 4.06,
124
+ "learning_rate": 9.519831289296397e-06,
125
+ "loss": 0.0557,
126
+ "step": 375
127
+ },
128
+ {
129
+ "epoch": 5.0,
130
+ "learning_rate": 9.624764935335318e-06,
131
+ "loss": 0.057,
132
+ "step": 400
133
+ },
134
+ {
135
+ "epoch": 5.0,
136
+ "eval_loss": 0.328857421875,
137
+ "eval_runtime": 4014.2783,
138
+ "eval_samples_per_second": 0.165,
139
+ "eval_steps_per_second": 0.021,
140
+ "eval_wer": 36.61723818350324,
141
+ "step": 400
142
+ },
143
+ {
144
+ "epoch": 5.03,
145
+ "learning_rate": 9.723272550712454e-06,
146
+ "loss": 0.0364,
147
+ "step": 425
148
+ },
149
+ {
150
+ "epoch": 5.05,
151
+ "learning_rate": 9.816095971633122e-06,
152
+ "loss": 0.0388,
153
+ "step": 450
154
+ },
155
+ {
156
+ "epoch": 6.0,
157
+ "learning_rate": 9.90385555539545e-06,
158
+ "loss": 0.0392,
159
+ "step": 475
160
+ },
161
+ {
162
+ "epoch": 6.03,
163
+ "learning_rate": 9.987075336738768e-06,
164
+ "loss": 0.0285,
165
+ "step": 500
166
+ },
167
+ {
168
+ "epoch": 6.03,
169
+ "eval_loss": 0.342529296875,
170
+ "eval_runtime": 4051.7069,
171
+ "eval_samples_per_second": 0.164,
172
+ "eval_steps_per_second": 0.02,
173
+ "eval_wer": 35.31974050046339,
174
+ "step": 500
175
+ },
176
+ {
177
+ "epoch": 6.05,
178
+ "learning_rate": 9.600000000000001e-06,
179
+ "loss": 0.0279,
180
+ "step": 525
181
+ },
182
+ {
183
+ "epoch": 6.08,
184
+ "learning_rate": 9.100000000000001e-06,
185
+ "loss": 0.0287,
186
+ "step": 550
187
+ },
188
+ {
189
+ "epoch": 7.02,
190
+ "learning_rate": 8.6e-06,
191
+ "loss": 0.0199,
192
+ "step": 575
193
+ },
194
+ {
195
+ "epoch": 7.05,
196
+ "learning_rate": 8.1e-06,
197
+ "loss": 0.0203,
198
+ "step": 600
199
+ },
200
+ {
201
+ "epoch": 7.05,
202
+ "eval_loss": 0.36474609375,
203
+ "eval_runtime": 4154.7446,
204
+ "eval_samples_per_second": 0.16,
205
+ "eval_steps_per_second": 0.02,
206
+ "eval_wer": 34.38368860055607,
207
+ "step": 600
208
+ },
209
+ {
210
+ "epoch": 7.07,
211
+ "learning_rate": 7.600000000000001e-06,
212
+ "loss": 0.0184,
213
+ "step": 625
214
+ },
215
+ {
216
+ "epoch": 8.02,
217
+ "learning_rate": 7.100000000000001e-06,
218
+ "loss": 0.0117,
219
+ "step": 650
220
+ },
221
+ {
222
+ "epoch": 8.04,
223
+ "learning_rate": 6.600000000000001e-06,
224
+ "loss": 0.0098,
225
+ "step": 675
226
+ },
227
+ {
228
+ "epoch": 8.07,
229
+ "learning_rate": 6.1e-06,
230
+ "loss": 0.0103,
231
+ "step": 700
232
+ },
233
+ {
234
+ "epoch": 8.07,
235
+ "eval_loss": 0.382568359375,
236
+ "eval_runtime": 4054.0209,
237
+ "eval_samples_per_second": 0.164,
238
+ "eval_steps_per_second": 0.02,
239
+ "eval_wer": 33.92029657089898,
240
+ "step": 700
241
+ },
242
+ {
243
+ "epoch": 8.07,
244
+ "step": 700,
245
+ "total_flos": 3.213687048481276e+18,
246
+ "train_loss": 0.0,
247
+ "train_runtime": 18.9864,
248
+ "train_samples_per_second": 842.709,
249
+ "train_steps_per_second": 52.669
250
+ }
251
+ ],
252
+ "logging_steps": 25,
253
+ "max_steps": 1000,
254
+ "num_input_tokens_seen": 0,
255
+ "num_train_epochs": 9223372036854775807,
256
+ "save_steps": 100,
257
+ "total_flos": 3.213687048481276e+18,
258
+ "train_batch_size": 16,
259
+ "trial_name": null,
260
+ "trial_params": null
261
+ }