razhan committed on
Commit
c4df450
1 Parent(s): 5695218

End of training

Browse files
Files changed (5) hide show
  1. README.md +14 -2
  2. all_results.json +14 -0
  3. eval_results.json +9 -0
  4. train_results.json +8 -0
  5. trainer_state.json +444 -0
README.md CHANGED
@@ -3,11 +3,23 @@ license: apache-2.0
3
  base_model: openai/whisper-tiny
4
  tags:
5
  - generated_from_trainer
 
 
6
  metrics:
7
  - wer
8
  model-index:
9
  - name: whisper-tiny-ckb
10
- results: []
 
 
 
 
 
 
 
 
 
 
11
  ---
12
 
13
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -15,7 +27,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # whisper-tiny-ckb
17
 
18
- This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
  - Loss: 0.2612
21
  - Wer: 0.4780
 
3
  base_model: openai/whisper-tiny
4
  tags:
5
  - generated_from_trainer
6
+ datasets:
7
+ - razhan/common_voice_ckb_16
8
  metrics:
9
  - wer
10
  model-index:
11
  - name: whisper-tiny-ckb
12
+ results:
13
+ - task:
14
+ name: Automatic Speech Recognition
15
+ type: automatic-speech-recognition
16
+ dataset:
17
+ name: razhan/common_voice_ckb_16
18
+ type: razhan/common_voice_ckb_16
19
+ metrics:
20
+ - name: Wer
21
+ type: wer
22
+ value: 0.47801004237740824
23
  ---
24
 
25
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
27
 
28
  # whisper-tiny-ckb
29
 
30
+ This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the razhan/common_voice_ckb_16 dataset.
31
  It achieves the following results on the evaluation set:
32
  - Loss: 0.2612
33
  - Wer: 0.4780
all_results.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.35,
3
+ "eval_loss": 0.26123046875,
4
+ "eval_runtime": 151.8487,
5
+ "eval_samples": 4940,
6
+ "eval_samples_per_second": 32.532,
7
+ "eval_steps_per_second": 0.066,
8
+ "eval_wer": 0.47801004237740824,
9
+ "train_loss": 0.4515265909830729,
10
+ "train_runtime": 14971.1378,
11
+ "train_samples": 105929,
12
+ "train_samples_per_second": 30.779,
13
+ "train_steps_per_second": 0.04
14
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.35,
3
+ "eval_loss": 0.26123046875,
4
+ "eval_runtime": 151.8487,
5
+ "eval_samples": 4940,
6
+ "eval_samples_per_second": 32.532,
7
+ "eval_steps_per_second": 0.066,
8
+ "eval_wer": 0.47801004237740824
9
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4.35,
3
+ "train_loss": 0.4515265909830729,
4
+ "train_runtime": 14971.1378,
5
+ "train_samples": 105929,
6
+ "train_samples_per_second": 30.779,
7
+ "train_steps_per_second": 0.04
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,444 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.47801004237740824,
3
+ "best_model_checkpoint": "./whisper-tiny-ckb/checkpoint-600",
4
+ "epoch": 4.3478260869565215,
5
+ "eval_steps": 100,
6
+ "global_step": 600,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.07,
13
+ "learning_rate": 2.6164804129562553e-06,
14
+ "loss": 3.7615,
15
+ "step": 10
16
+ },
17
+ {
18
+ "epoch": 0.14,
19
+ "learning_rate": 4.980934789368156e-06,
20
+ "loss": 2.8759,
21
+ "step": 20
22
+ },
23
+ {
24
+ "epoch": 0.22,
25
+ "learning_rate": 5.99823228863792e-06,
26
+ "loss": 2.0115,
27
+ "step": 30
28
+ },
29
+ {
30
+ "epoch": 0.29,
31
+ "learning_rate": 6.655623437887147e-06,
32
+ "loss": 1.4273,
33
+ "step": 40
34
+ },
35
+ {
36
+ "epoch": 0.36,
37
+ "learning_rate": 7.1422479480192775e-06,
38
+ "loss": 1.0629,
39
+ "step": 50
40
+ },
41
+ {
42
+ "epoch": 0.43,
43
+ "learning_rate": 7.528775214088733e-06,
44
+ "loss": 0.864,
45
+ "step": 60
46
+ },
47
+ {
48
+ "epoch": 0.51,
49
+ "learning_rate": 7.849441238868767e-06,
50
+ "loss": 0.69,
51
+ "step": 70
52
+ },
53
+ {
54
+ "epoch": 0.58,
55
+ "learning_rate": 8.123456553166724e-06,
56
+ "loss": 0.5759,
57
+ "step": 80
58
+ },
59
+ {
60
+ "epoch": 0.65,
61
+ "learning_rate": 8.36268666504982e-06,
62
+ "loss": 0.5048,
63
+ "step": 90
64
+ },
65
+ {
66
+ "epoch": 0.72,
67
+ "learning_rate": 8.574976672697987e-06,
68
+ "loss": 0.4502,
69
+ "step": 100
70
+ },
71
+ {
72
+ "epoch": 0.72,
73
+ "eval_loss": 0.498779296875,
74
+ "eval_runtime": 154.3428,
75
+ "eval_samples_per_second": 32.007,
76
+ "eval_steps_per_second": 0.065,
77
+ "eval_wer": 0.7165699227235497,
78
+ "step": 100
79
+ },
80
+ {
81
+ "epoch": 0.8,
82
+ "learning_rate": 8.765784640355151e-06,
83
+ "loss": 0.4391,
84
+ "step": 110
85
+ },
86
+ {
87
+ "epoch": 0.87,
88
+ "learning_rate": 8.93906144297322e-06,
89
+ "loss": 0.4092,
90
+ "step": 120
91
+ },
92
+ {
93
+ "epoch": 0.94,
94
+ "learning_rate": 9.09775921698996e-06,
95
+ "loss": 0.386,
96
+ "step": 130
97
+ },
98
+ {
99
+ "epoch": 1.01,
100
+ "learning_rate": 9.244141981517345e-06,
101
+ "loss": 0.3711,
102
+ "step": 140
103
+ },
104
+ {
105
+ "epoch": 1.09,
106
+ "learning_rate": 9.379984164319582e-06,
107
+ "loss": 0.3478,
108
+ "step": 150
109
+ },
110
+ {
111
+ "epoch": 1.16,
112
+ "learning_rate": 9.50670232443118e-06,
113
+ "loss": 0.3501,
114
+ "step": 160
115
+ },
116
+ {
117
+ "epoch": 1.23,
118
+ "learning_rate": 9.625445353695127e-06,
119
+ "loss": 0.3344,
120
+ "step": 170
121
+ },
122
+ {
123
+ "epoch": 1.3,
124
+ "learning_rate": 9.73715793581418e-06,
125
+ "loss": 0.3167,
126
+ "step": 180
127
+ },
128
+ {
129
+ "epoch": 1.38,
130
+ "learning_rate": 9.842626246843015e-06,
131
+ "loss": 0.3082,
132
+ "step": 190
133
+ },
134
+ {
135
+ "epoch": 1.45,
136
+ "learning_rate": 9.942511545878664e-06,
137
+ "loss": 0.2977,
138
+ "step": 200
139
+ },
140
+ {
141
+ "epoch": 1.45,
142
+ "eval_loss": 0.355712890625,
143
+ "eval_runtime": 154.4865,
144
+ "eval_samples_per_second": 31.977,
145
+ "eval_steps_per_second": 0.065,
146
+ "eval_wer": 0.5858765713471742,
147
+ "step": 200
148
+ },
149
+ {
150
+ "epoch": 1.52,
151
+ "learning_rate": 9.925e-06,
152
+ "loss": 0.3017,
153
+ "step": 210
154
+ },
155
+ {
156
+ "epoch": 1.59,
157
+ "learning_rate": 9.675000000000001e-06,
158
+ "loss": 0.2896,
159
+ "step": 220
160
+ },
161
+ {
162
+ "epoch": 1.67,
163
+ "learning_rate": 9.425e-06,
164
+ "loss": 0.2844,
165
+ "step": 230
166
+ },
167
+ {
168
+ "epoch": 1.74,
169
+ "learning_rate": 9.175000000000001e-06,
170
+ "loss": 0.2729,
171
+ "step": 240
172
+ },
173
+ {
174
+ "epoch": 1.81,
175
+ "learning_rate": 8.925e-06,
176
+ "loss": 0.2675,
177
+ "step": 250
178
+ },
179
+ {
180
+ "epoch": 1.88,
181
+ "learning_rate": 8.675e-06,
182
+ "loss": 0.2796,
183
+ "step": 260
184
+ },
185
+ {
186
+ "epoch": 1.96,
187
+ "learning_rate": 8.425000000000001e-06,
188
+ "loss": 0.2726,
189
+ "step": 270
190
+ },
191
+ {
192
+ "epoch": 2.03,
193
+ "learning_rate": 8.175e-06,
194
+ "loss": 0.2623,
195
+ "step": 280
196
+ },
197
+ {
198
+ "epoch": 2.1,
199
+ "learning_rate": 7.925000000000001e-06,
200
+ "loss": 0.2456,
201
+ "step": 290
202
+ },
203
+ {
204
+ "epoch": 2.17,
205
+ "learning_rate": 7.675e-06,
206
+ "loss": 0.2494,
207
+ "step": 300
208
+ },
209
+ {
210
+ "epoch": 2.17,
211
+ "eval_loss": 0.3095703125,
212
+ "eval_runtime": 165.9821,
213
+ "eval_samples_per_second": 29.762,
214
+ "eval_steps_per_second": 0.06,
215
+ "eval_wer": 0.5314625547523236,
216
+ "step": 300
217
+ },
218
+ {
219
+ "epoch": 2.25,
220
+ "learning_rate": 7.425000000000001e-06,
221
+ "loss": 0.2531,
222
+ "step": 310
223
+ },
224
+ {
225
+ "epoch": 2.32,
226
+ "learning_rate": 7.175000000000001e-06,
227
+ "loss": 0.2496,
228
+ "step": 320
229
+ },
230
+ {
231
+ "epoch": 2.39,
232
+ "learning_rate": 6.925000000000001e-06,
233
+ "loss": 0.2421,
234
+ "step": 330
235
+ },
236
+ {
237
+ "epoch": 2.46,
238
+ "learning_rate": 6.6750000000000005e-06,
239
+ "loss": 0.2337,
240
+ "step": 340
241
+ },
242
+ {
243
+ "epoch": 2.54,
244
+ "learning_rate": 6.425e-06,
245
+ "loss": 0.2358,
246
+ "step": 350
247
+ },
248
+ {
249
+ "epoch": 2.61,
250
+ "learning_rate": 6.175000000000001e-06,
251
+ "loss": 0.2433,
252
+ "step": 360
253
+ },
254
+ {
255
+ "epoch": 2.68,
256
+ "learning_rate": 5.925000000000001e-06,
257
+ "loss": 0.2335,
258
+ "step": 370
259
+ },
260
+ {
261
+ "epoch": 2.75,
262
+ "learning_rate": 5.675000000000001e-06,
263
+ "loss": 0.2301,
264
+ "step": 380
265
+ },
266
+ {
267
+ "epoch": 2.83,
268
+ "learning_rate": 5.4250000000000006e-06,
269
+ "loss": 0.2223,
270
+ "step": 390
271
+ },
272
+ {
273
+ "epoch": 2.9,
274
+ "learning_rate": 5.1750000000000004e-06,
275
+ "loss": 0.2224,
276
+ "step": 400
277
+ },
278
+ {
279
+ "epoch": 2.9,
280
+ "eval_loss": 0.28173828125,
281
+ "eval_runtime": 152.093,
282
+ "eval_samples_per_second": 32.48,
283
+ "eval_steps_per_second": 0.066,
284
+ "eval_wer": 0.5008012535166126,
285
+ "step": 400
286
+ },
287
+ {
288
+ "epoch": 2.97,
289
+ "learning_rate": 4.925e-06,
290
+ "loss": 0.2293,
291
+ "step": 410
292
+ },
293
+ {
294
+ "epoch": 3.04,
295
+ "learning_rate": 4.675000000000001e-06,
296
+ "loss": 0.2255,
297
+ "step": 420
298
+ },
299
+ {
300
+ "epoch": 3.12,
301
+ "learning_rate": 4.425e-06,
302
+ "loss": 0.2131,
303
+ "step": 430
304
+ },
305
+ {
306
+ "epoch": 3.19,
307
+ "learning_rate": 4.175e-06,
308
+ "loss": 0.2106,
309
+ "step": 440
310
+ },
311
+ {
312
+ "epoch": 3.26,
313
+ "learning_rate": 3.9250000000000005e-06,
314
+ "loss": 0.2176,
315
+ "step": 450
316
+ },
317
+ {
318
+ "epoch": 3.33,
319
+ "learning_rate": 3.6750000000000004e-06,
320
+ "loss": 0.22,
321
+ "step": 460
322
+ },
323
+ {
324
+ "epoch": 3.41,
325
+ "learning_rate": 3.4250000000000007e-06,
326
+ "loss": 0.2151,
327
+ "step": 470
328
+ },
329
+ {
330
+ "epoch": 3.48,
331
+ "learning_rate": 3.175e-06,
332
+ "loss": 0.2082,
333
+ "step": 480
334
+ },
335
+ {
336
+ "epoch": 3.55,
337
+ "learning_rate": 2.925e-06,
338
+ "loss": 0.2014,
339
+ "step": 490
340
+ },
341
+ {
342
+ "epoch": 3.62,
343
+ "learning_rate": 2.6750000000000002e-06,
344
+ "loss": 0.2148,
345
+ "step": 500
346
+ },
347
+ {
348
+ "epoch": 3.62,
349
+ "eval_loss": 0.2666015625,
350
+ "eval_runtime": 152.4154,
351
+ "eval_samples_per_second": 32.411,
352
+ "eval_steps_per_second": 0.066,
353
+ "eval_wer": 0.481927281791959,
354
+ "step": 500
355
+ },
356
+ {
357
+ "epoch": 3.7,
358
+ "learning_rate": 2.425e-06,
359
+ "loss": 0.2158,
360
+ "step": 510
361
+ },
362
+ {
363
+ "epoch": 3.77,
364
+ "learning_rate": 2.1750000000000004e-06,
365
+ "loss": 0.2103,
366
+ "step": 520
367
+ },
368
+ {
369
+ "epoch": 3.84,
370
+ "learning_rate": 1.925e-06,
371
+ "loss": 0.2091,
372
+ "step": 530
373
+ },
374
+ {
375
+ "epoch": 3.91,
376
+ "learning_rate": 1.6750000000000003e-06,
377
+ "loss": 0.1998,
378
+ "step": 540
379
+ },
380
+ {
381
+ "epoch": 3.99,
382
+ "learning_rate": 1.425e-06,
383
+ "loss": 0.2068,
384
+ "step": 550
385
+ },
386
+ {
387
+ "epoch": 4.06,
388
+ "learning_rate": 1.175e-06,
389
+ "loss": 0.212,
390
+ "step": 560
391
+ },
392
+ {
393
+ "epoch": 4.13,
394
+ "learning_rate": 9.25e-07,
395
+ "loss": 0.2034,
396
+ "step": 570
397
+ },
398
+ {
399
+ "epoch": 4.2,
400
+ "learning_rate": 6.750000000000001e-07,
401
+ "loss": 0.2013,
402
+ "step": 580
403
+ },
404
+ {
405
+ "epoch": 4.28,
406
+ "learning_rate": 4.2500000000000006e-07,
407
+ "loss": 0.1919,
408
+ "step": 590
409
+ },
410
+ {
411
+ "epoch": 4.35,
412
+ "learning_rate": 1.7500000000000002e-07,
413
+ "loss": 0.2096,
414
+ "step": 600
415
+ },
416
+ {
417
+ "epoch": 4.35,
418
+ "eval_loss": 0.26123046875,
419
+ "eval_runtime": 154.28,
420
+ "eval_samples_per_second": 32.02,
421
+ "eval_steps_per_second": 0.065,
422
+ "eval_wer": 0.47801004237740824,
423
+ "step": 600
424
+ },
425
+ {
426
+ "epoch": 4.35,
427
+ "step": 600,
428
+ "total_flos": 1.1344381987478569e+19,
429
+ "train_loss": 0.4515265909830729,
430
+ "train_runtime": 14971.1378,
431
+ "train_samples_per_second": 30.779,
432
+ "train_steps_per_second": 0.04
433
+ }
434
+ ],
435
+ "logging_steps": 10,
436
+ "max_steps": 600,
437
+ "num_input_tokens_seen": 0,
438
+ "num_train_epochs": 5,
439
+ "save_steps": 100,
440
+ "total_flos": 1.1344381987478569e+19,
441
+ "train_batch_size": 192,
442
+ "trial_name": null,
443
+ "trial_params": null
444
+ }