csikasote commited on
Commit
c3f6a57
·
verified ·
1 Parent(s): 37b3e07

End of training

Browse files
Files changed (5) hide show
  1. README.md +16 -4
  2. all_results.json +15 -0
  3. eval_results.json +9 -0
  4. train_results.json +9 -0
  5. trainer_state.json +506 -0
README.md CHANGED
@@ -4,11 +4,23 @@ license: apache-2.0
4
  base_model: openai/whisper-medium
5
  tags:
6
  - generated_from_trainer
 
 
7
  metrics:
8
  - wer
9
  model-index:
10
  - name: whisper-medium-nyagen-female-model
11
- results: []
 
 
 
 
 
 
 
 
 
 
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,10 +28,10 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # whisper-medium-nyagen-female-model
18
 
19
- This model is a fine-tuned version of [openai/whisper-medium](https://huggingface.co/openai/whisper-medium) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.4384
22
- - Wer: 0.2314
23
 
24
  ## Model description
25
 
 
4
  base_model: openai/whisper-medium
5
  tags:
6
  - generated_from_trainer
7
+ datasets:
8
+ - nyagen
9
  metrics:
10
  - wer
11
  model-index:
12
  - name: whisper-medium-nyagen-female-model
13
+ results:
14
+ - task:
15
+ name: Automatic Speech Recognition
16
+ type: automatic-speech-recognition
17
+ dataset:
18
+ name: nyagen
19
+ type: nyagen
20
+ metrics:
21
+ - name: Wer
22
+ type: wer
23
+ value: 0.25738585496866606
24
  ---
25
 
26
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
28
 
29
  # whisper-medium-nyagen-female-model
30
 
31
+ This model is a fine-tuned version of [openai/whisper-medium](https://huggingface.co/openai/whisper-medium) on the nyagen dataset.
32
  It achieves the following results on the evaluation set:
33
+ - Loss: 0.3796
34
+ - Wer: 0.2574
35
 
36
  ## Model description
37
 
all_results.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.284023668639053,
3
+ "eval_loss": 0.3796495497226715,
4
+ "eval_runtime": 80.4724,
5
+ "eval_samples": 169,
6
+ "eval_samples_per_second": 2.1,
7
+ "eval_steps_per_second": 0.534,
8
+ "eval_wer": 0.25738585496866606,
9
+ "total_flos": 1.140628044644352e+19,
10
+ "train_loss": 0.6191167198973042,
11
+ "train_runtime": 2923.212,
12
+ "train_samples": 1349,
13
+ "train_samples_per_second": 13.684,
14
+ "train_steps_per_second": 1.71
15
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.284023668639053,
3
+ "eval_loss": 0.3796495497226715,
4
+ "eval_runtime": 80.4724,
5
+ "eval_samples": 169,
6
+ "eval_samples_per_second": 2.1,
7
+ "eval_steps_per_second": 0.534,
8
+ "eval_wer": 0.25738585496866606
9
+ }
train_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8.284023668639053,
3
+ "total_flos": 1.140628044644352e+19,
4
+ "train_loss": 0.6191167198973042,
5
+ "train_runtime": 2923.212,
6
+ "train_samples": 1349,
7
+ "train_samples_per_second": 13.684,
8
+ "train_steps_per_second": 1.71
9
+ }
trainer_state.json ADDED
@@ -0,0 +1,506 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.3796495497226715,
3
+ "best_model_checkpoint": "/scratch/skscla001/speech/results/whisper-medium-nyagen-female-model/checkpoint-800",
4
+ "epoch": 8.284023668639053,
5
+ "eval_steps": 200,
6
+ "global_step": 1400,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.14792899408284024,
13
+ "grad_norm": 51.66197204589844,
14
+ "learning_rate": 4.2000000000000006e-07,
15
+ "loss": 5.8232,
16
+ "step": 25
17
+ },
18
+ {
19
+ "epoch": 0.2958579881656805,
20
+ "grad_norm": 44.10362243652344,
21
+ "learning_rate": 9.200000000000001e-07,
22
+ "loss": 4.7067,
23
+ "step": 50
24
+ },
25
+ {
26
+ "epoch": 0.4437869822485207,
27
+ "grad_norm": 28.569969177246094,
28
+ "learning_rate": 1.42e-06,
29
+ "loss": 3.4308,
30
+ "step": 75
31
+ },
32
+ {
33
+ "epoch": 0.591715976331361,
34
+ "grad_norm": 30.82530975341797,
35
+ "learning_rate": 1.9200000000000003e-06,
36
+ "loss": 2.6134,
37
+ "step": 100
38
+ },
39
+ {
40
+ "epoch": 0.7396449704142012,
41
+ "grad_norm": 25.239219665527344,
42
+ "learning_rate": 2.42e-06,
43
+ "loss": 1.9457,
44
+ "step": 125
45
+ },
46
+ {
47
+ "epoch": 0.8875739644970414,
48
+ "grad_norm": 22.162986755371094,
49
+ "learning_rate": 2.92e-06,
50
+ "loss": 1.6779,
51
+ "step": 150
52
+ },
53
+ {
54
+ "epoch": 1.0355029585798816,
55
+ "grad_norm": 20.636507034301758,
56
+ "learning_rate": 3.4200000000000007e-06,
57
+ "loss": 1.4326,
58
+ "step": 175
59
+ },
60
+ {
61
+ "epoch": 1.183431952662722,
62
+ "grad_norm": 26.6777400970459,
63
+ "learning_rate": 3.920000000000001e-06,
64
+ "loss": 1.1709,
65
+ "step": 200
66
+ },
67
+ {
68
+ "epoch": 1.183431952662722,
69
+ "eval_loss": 0.6064821481704712,
70
+ "eval_runtime": 82.6612,
71
+ "eval_samples_per_second": 2.044,
72
+ "eval_steps_per_second": 0.52,
73
+ "eval_wer": 0.39973142345568485,
74
+ "step": 200
75
+ },
76
+ {
77
+ "epoch": 1.331360946745562,
78
+ "grad_norm": 25.014854431152344,
79
+ "learning_rate": 4.42e-06,
80
+ "loss": 1.0305,
81
+ "step": 225
82
+ },
83
+ {
84
+ "epoch": 1.4792899408284024,
85
+ "grad_norm": 17.5407772064209,
86
+ "learning_rate": 4.92e-06,
87
+ "loss": 0.9408,
88
+ "step": 250
89
+ },
90
+ {
91
+ "epoch": 1.6272189349112427,
92
+ "grad_norm": 21.393421173095703,
93
+ "learning_rate": 5.420000000000001e-06,
94
+ "loss": 0.9531,
95
+ "step": 275
96
+ },
97
+ {
98
+ "epoch": 1.7751479289940828,
99
+ "grad_norm": 17.972383499145508,
100
+ "learning_rate": 5.92e-06,
101
+ "loss": 0.8432,
102
+ "step": 300
103
+ },
104
+ {
105
+ "epoch": 1.9230769230769231,
106
+ "grad_norm": 14.931800842285156,
107
+ "learning_rate": 6.42e-06,
108
+ "loss": 0.8653,
109
+ "step": 325
110
+ },
111
+ {
112
+ "epoch": 2.0710059171597632,
113
+ "grad_norm": 15.048805236816406,
114
+ "learning_rate": 6.92e-06,
115
+ "loss": 0.6679,
116
+ "step": 350
117
+ },
118
+ {
119
+ "epoch": 2.2189349112426036,
120
+ "grad_norm": 13.169198036193848,
121
+ "learning_rate": 7.420000000000001e-06,
122
+ "loss": 0.4734,
123
+ "step": 375
124
+ },
125
+ {
126
+ "epoch": 2.366863905325444,
127
+ "grad_norm": 9.416093826293945,
128
+ "learning_rate": 7.92e-06,
129
+ "loss": 0.4797,
130
+ "step": 400
131
+ },
132
+ {
133
+ "epoch": 2.366863905325444,
134
+ "eval_loss": 0.4227275848388672,
135
+ "eval_runtime": 88.219,
136
+ "eval_samples_per_second": 1.916,
137
+ "eval_steps_per_second": 0.487,
138
+ "eval_wer": 0.39077887197851385,
139
+ "step": 400
140
+ },
141
+ {
142
+ "epoch": 2.5147928994082838,
143
+ "grad_norm": 17.11431884765625,
144
+ "learning_rate": 8.42e-06,
145
+ "loss": 0.5092,
146
+ "step": 425
147
+ },
148
+ {
149
+ "epoch": 2.662721893491124,
150
+ "grad_norm": 12.54430103302002,
151
+ "learning_rate": 8.920000000000001e-06,
152
+ "loss": 0.4516,
153
+ "step": 450
154
+ },
155
+ {
156
+ "epoch": 2.8106508875739644,
157
+ "grad_norm": 12.5538911819458,
158
+ "learning_rate": 9.42e-06,
159
+ "loss": 0.4576,
160
+ "step": 475
161
+ },
162
+ {
163
+ "epoch": 2.9585798816568047,
164
+ "grad_norm": 13.34439754486084,
165
+ "learning_rate": 9.920000000000002e-06,
166
+ "loss": 0.4957,
167
+ "step": 500
168
+ },
169
+ {
170
+ "epoch": 3.106508875739645,
171
+ "grad_norm": 8.777567863464355,
172
+ "learning_rate": 9.953333333333333e-06,
173
+ "loss": 0.3319,
174
+ "step": 525
175
+ },
176
+ {
177
+ "epoch": 3.2544378698224854,
178
+ "grad_norm": 2.8179187774658203,
179
+ "learning_rate": 9.89777777777778e-06,
180
+ "loss": 0.2229,
181
+ "step": 550
182
+ },
183
+ {
184
+ "epoch": 3.4023668639053253,
185
+ "grad_norm": 6.126067161560059,
186
+ "learning_rate": 9.842222222222223e-06,
187
+ "loss": 0.2144,
188
+ "step": 575
189
+ },
190
+ {
191
+ "epoch": 3.5502958579881656,
192
+ "grad_norm": 8.303226470947266,
193
+ "learning_rate": 9.786666666666667e-06,
194
+ "loss": 0.2388,
195
+ "step": 600
196
+ },
197
+ {
198
+ "epoch": 3.5502958579881656,
199
+ "eval_loss": 0.39361897110939026,
200
+ "eval_runtime": 81.4549,
201
+ "eval_samples_per_second": 2.075,
202
+ "eval_steps_per_second": 0.528,
203
+ "eval_wer": 0.29319606087735006,
204
+ "step": 600
205
+ },
206
+ {
207
+ "epoch": 3.698224852071006,
208
+ "grad_norm": 14.067414283752441,
209
+ "learning_rate": 9.731111111111113e-06,
210
+ "loss": 0.2556,
211
+ "step": 625
212
+ },
213
+ {
214
+ "epoch": 3.8461538461538463,
215
+ "grad_norm": 10.964970588684082,
216
+ "learning_rate": 9.675555555555555e-06,
217
+ "loss": 0.2364,
218
+ "step": 650
219
+ },
220
+ {
221
+ "epoch": 3.994082840236686,
222
+ "grad_norm": 12.65548324584961,
223
+ "learning_rate": 9.620000000000001e-06,
224
+ "loss": 0.3048,
225
+ "step": 675
226
+ },
227
+ {
228
+ "epoch": 4.1420118343195265,
229
+ "grad_norm": 13.840071678161621,
230
+ "learning_rate": 9.564444444444445e-06,
231
+ "loss": 0.1798,
232
+ "step": 700
233
+ },
234
+ {
235
+ "epoch": 4.289940828402367,
236
+ "grad_norm": 5.432651042938232,
237
+ "learning_rate": 9.508888888888889e-06,
238
+ "loss": 0.1384,
239
+ "step": 725
240
+ },
241
+ {
242
+ "epoch": 4.437869822485207,
243
+ "grad_norm": 4.243218898773193,
244
+ "learning_rate": 9.453333333333335e-06,
245
+ "loss": 0.1131,
246
+ "step": 750
247
+ },
248
+ {
249
+ "epoch": 4.585798816568047,
250
+ "grad_norm": 8.833934783935547,
251
+ "learning_rate": 9.397777777777779e-06,
252
+ "loss": 0.1031,
253
+ "step": 775
254
+ },
255
+ {
256
+ "epoch": 4.733727810650888,
257
+ "grad_norm": 10.180987358093262,
258
+ "learning_rate": 9.342222222222223e-06,
259
+ "loss": 0.1376,
260
+ "step": 800
261
+ },
262
+ {
263
+ "epoch": 4.733727810650888,
264
+ "eval_loss": 0.3796495497226715,
265
+ "eval_runtime": 80.6054,
266
+ "eval_samples_per_second": 2.097,
267
+ "eval_steps_per_second": 0.533,
268
+ "eval_wer": 0.25738585496866606,
269
+ "step": 800
270
+ },
271
+ {
272
+ "epoch": 4.881656804733728,
273
+ "grad_norm": 7.904026985168457,
274
+ "learning_rate": 9.286666666666667e-06,
275
+ "loss": 0.1003,
276
+ "step": 825
277
+ },
278
+ {
279
+ "epoch": 5.029585798816568,
280
+ "grad_norm": 3.1111233234405518,
281
+ "learning_rate": 9.231111111111111e-06,
282
+ "loss": 0.1213,
283
+ "step": 850
284
+ },
285
+ {
286
+ "epoch": 5.177514792899408,
287
+ "grad_norm": 4.056166648864746,
288
+ "learning_rate": 9.175555555555557e-06,
289
+ "loss": 0.073,
290
+ "step": 875
291
+ },
292
+ {
293
+ "epoch": 5.325443786982248,
294
+ "grad_norm": 3.2874598503112793,
295
+ "learning_rate": 9.12e-06,
296
+ "loss": 0.0756,
297
+ "step": 900
298
+ },
299
+ {
300
+ "epoch": 5.4733727810650885,
301
+ "grad_norm": 6.1852641105651855,
302
+ "learning_rate": 9.064444444444447e-06,
303
+ "loss": 0.0681,
304
+ "step": 925
305
+ },
306
+ {
307
+ "epoch": 5.621301775147929,
308
+ "grad_norm": 8.725586891174316,
309
+ "learning_rate": 9.008888888888889e-06,
310
+ "loss": 0.08,
311
+ "step": 950
312
+ },
313
+ {
314
+ "epoch": 5.769230769230769,
315
+ "grad_norm": 6.852264881134033,
316
+ "learning_rate": 8.953333333333335e-06,
317
+ "loss": 0.0522,
318
+ "step": 975
319
+ },
320
+ {
321
+ "epoch": 5.9171597633136095,
322
+ "grad_norm": 5.19258975982666,
323
+ "learning_rate": 8.897777777777779e-06,
324
+ "loss": 0.0765,
325
+ "step": 1000
326
+ },
327
+ {
328
+ "epoch": 5.9171597633136095,
329
+ "eval_loss": 0.4010450541973114,
330
+ "eval_runtime": 83.2846,
331
+ "eval_samples_per_second": 2.029,
332
+ "eval_steps_per_second": 0.516,
333
+ "eval_wer": 0.28424350940017906,
334
+ "step": 1000
335
+ },
336
+ {
337
+ "epoch": 6.06508875739645,
338
+ "grad_norm": 9.290264129638672,
339
+ "learning_rate": 8.842222222222223e-06,
340
+ "loss": 0.056,
341
+ "step": 1025
342
+ },
343
+ {
344
+ "epoch": 6.21301775147929,
345
+ "grad_norm": 5.741577625274658,
346
+ "learning_rate": 8.786666666666668e-06,
347
+ "loss": 0.042,
348
+ "step": 1050
349
+ },
350
+ {
351
+ "epoch": 6.3609467455621305,
352
+ "grad_norm": 2.9526829719543457,
353
+ "learning_rate": 8.73111111111111e-06,
354
+ "loss": 0.0346,
355
+ "step": 1075
356
+ },
357
+ {
358
+ "epoch": 6.508875739644971,
359
+ "grad_norm": 4.198945999145508,
360
+ "learning_rate": 8.675555555555556e-06,
361
+ "loss": 0.049,
362
+ "step": 1100
363
+ },
364
+ {
365
+ "epoch": 6.65680473372781,
366
+ "grad_norm": 4.736867427825928,
367
+ "learning_rate": 8.62e-06,
368
+ "loss": 0.053,
369
+ "step": 1125
370
+ },
371
+ {
372
+ "epoch": 6.804733727810651,
373
+ "grad_norm": 4.120213985443115,
374
+ "learning_rate": 8.564444444444445e-06,
375
+ "loss": 0.054,
376
+ "step": 1150
377
+ },
378
+ {
379
+ "epoch": 6.952662721893491,
380
+ "grad_norm": 4.600209712982178,
381
+ "learning_rate": 8.50888888888889e-06,
382
+ "loss": 0.0383,
383
+ "step": 1175
384
+ },
385
+ {
386
+ "epoch": 7.100591715976331,
387
+ "grad_norm": 2.9512381553649902,
388
+ "learning_rate": 8.453333333333334e-06,
389
+ "loss": 0.0344,
390
+ "step": 1200
391
+ },
392
+ {
393
+ "epoch": 7.100591715976331,
394
+ "eval_loss": 0.4033794701099396,
395
+ "eval_runtime": 80.3421,
396
+ "eval_samples_per_second": 2.104,
397
+ "eval_steps_per_second": 0.535,
398
+ "eval_wer": 0.23813786929274844,
399
+ "step": 1200
400
+ },
401
+ {
402
+ "epoch": 7.2485207100591715,
403
+ "grad_norm": 2.454542636871338,
404
+ "learning_rate": 8.397777777777778e-06,
405
+ "loss": 0.0303,
406
+ "step": 1225
407
+ },
408
+ {
409
+ "epoch": 7.396449704142012,
410
+ "grad_norm": 3.2096927165985107,
411
+ "learning_rate": 8.342222222222222e-06,
412
+ "loss": 0.0315,
413
+ "step": 1250
414
+ },
415
+ {
416
+ "epoch": 7.544378698224852,
417
+ "grad_norm": 5.889292240142822,
418
+ "learning_rate": 8.286666666666668e-06,
419
+ "loss": 0.0183,
420
+ "step": 1275
421
+ },
422
+ {
423
+ "epoch": 7.6923076923076925,
424
+ "grad_norm": 4.196884632110596,
425
+ "learning_rate": 8.231111111111112e-06,
426
+ "loss": 0.0363,
427
+ "step": 1300
428
+ },
429
+ {
430
+ "epoch": 7.840236686390533,
431
+ "grad_norm": 5.16650390625,
432
+ "learning_rate": 8.175555555555556e-06,
433
+ "loss": 0.0376,
434
+ "step": 1325
435
+ },
436
+ {
437
+ "epoch": 7.988165680473373,
438
+ "grad_norm": 2.2055373191833496,
439
+ "learning_rate": 8.120000000000002e-06,
440
+ "loss": 0.025,
441
+ "step": 1350
442
+ },
443
+ {
444
+ "epoch": 8.136094674556213,
445
+ "grad_norm": 1.7722326517105103,
446
+ "learning_rate": 8.064444444444444e-06,
447
+ "loss": 0.0166,
448
+ "step": 1375
449
+ },
450
+ {
451
+ "epoch": 8.284023668639053,
452
+ "grad_norm": 2.3344950675964355,
453
+ "learning_rate": 8.00888888888889e-06,
454
+ "loss": 0.0207,
455
+ "step": 1400
456
+ },
457
+ {
458
+ "epoch": 8.284023668639053,
459
+ "eval_loss": 0.4384337067604065,
460
+ "eval_runtime": 79.5932,
461
+ "eval_samples_per_second": 2.123,
462
+ "eval_steps_per_second": 0.54,
463
+ "eval_wer": 0.2314234556848702,
464
+ "step": 1400
465
+ },
466
+ {
467
+ "epoch": 8.284023668639053,
468
+ "step": 1400,
469
+ "total_flos": 1.140628044644352e+19,
470
+ "train_loss": 0.6191167198973042,
471
+ "train_runtime": 2923.212,
472
+ "train_samples_per_second": 13.684,
473
+ "train_steps_per_second": 1.71
474
+ }
475
+ ],
476
+ "logging_steps": 25,
477
+ "max_steps": 5000,
478
+ "num_input_tokens_seen": 0,
479
+ "num_train_epochs": 30,
480
+ "save_steps": 200,
481
+ "stateful_callbacks": {
482
+ "EarlyStoppingCallback": {
483
+ "args": {
484
+ "early_stopping_patience": 3,
485
+ "early_stopping_threshold": 0.0
486
+ },
487
+ "attributes": {
488
+ "early_stopping_patience_counter": 3
489
+ }
490
+ },
491
+ "TrainerControl": {
492
+ "args": {
493
+ "should_epoch_stop": false,
494
+ "should_evaluate": false,
495
+ "should_log": false,
496
+ "should_save": true,
497
+ "should_training_stop": true
498
+ },
499
+ "attributes": {}
500
+ }
501
+ },
502
+ "total_flos": 1.140628044644352e+19,
503
+ "train_batch_size": 4,
504
+ "trial_name": null,
505
+ "trial_params": null
506
+ }