drmeeseeks commited on
Commit
96dccab
1 Parent(s): f4a81be

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 2000.0,
3
- "eval_loss": 6.801175117492676,
4
- "eval_runtime": 8.6897,
5
- "eval_samples": 5,
6
- "eval_samples_per_second": 0.575,
7
- "eval_steps_per_second": 0.115,
8
- "eval_wer": 100.0,
9
  "train_loss": 0.10164999849759625,
10
- "train_runtime": 1221.0979,
11
- "train_samples_per_second": 104.824,
12
- "train_steps_per_second": 1.638
13
  }
 
1
  {
2
  "epoch": 2000.0,
3
+ "eval_loss": 6.883942604064941,
4
+ "eval_runtime": 28.6806,
5
+ "eval_samples": 20,
6
+ "eval_samples_per_second": 0.697,
7
+ "eval_steps_per_second": 0.035,
8
+ "eval_wer": 103.08219178082192,
9
  "train_loss": 0.10164999849759625,
10
+ "train_runtime": 954.9086,
11
+ "train_samples_per_second": 134.044,
12
+ "train_steps_per_second": 2.094
13
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 2000.0,
3
- "eval_loss": 6.801175117492676,
4
- "eval_runtime": 8.6897,
5
- "eval_samples": 5,
6
- "eval_samples_per_second": 0.575,
7
- "eval_steps_per_second": 0.115,
8
- "eval_wer": 100.0
9
  }
 
1
  {
2
  "epoch": 2000.0,
3
+ "eval_loss": 6.883942604064941,
4
+ "eval_runtime": 28.6806,
5
+ "eval_samples": 20,
6
+ "eval_samples_per_second": 0.697,
7
+ "eval_steps_per_second": 0.035,
8
+ "eval_wer": 103.08219178082192
9
  }
runs/Dec25_16-23-07_129-213-85-198/events.out.tfevents.1671986446.129-213-85-198.81515.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07668bdce15340b34014a604d805cb80d0d496645c8f0ea6b507f53e8fe3602b
3
+ size 358
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 2000.0,
3
  "train_loss": 0.10164999849759625,
4
- "train_runtime": 1221.0979,
5
- "train_samples_per_second": 104.824,
6
- "train_steps_per_second": 1.638
7
  }
 
1
  {
2
  "epoch": 2000.0,
3
  "train_loss": 0.10164999849759625,
4
+ "train_runtime": 954.9086,
5
+ "train_samples_per_second": 134.044,
6
+ "train_steps_per_second": 2.094
7
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 100.0,
3
- "best_model_checkpoint": "./whisper-small-amet/checkpoint-1100",
4
  "epoch": 2000.0,
5
  "global_step": 2000,
6
  "is_hyper_param_search": false,
@@ -33,11 +33,11 @@
33
  },
34
  {
35
  "epoch": 100.0,
36
- "eval_loss": 2.7051408290863037,
37
- "eval_runtime": 8.4302,
38
- "eval_samples_per_second": 0.593,
39
- "eval_steps_per_second": 0.119,
40
- "eval_wer": 276.0,
41
  "step": 100
42
  },
43
  {
@@ -66,11 +66,11 @@
66
  },
67
  {
68
  "epoch": 200.0,
69
- "eval_loss": 3.741528034210205,
70
- "eval_runtime": 8.6419,
71
- "eval_samples_per_second": 0.579,
72
- "eval_steps_per_second": 0.116,
73
- "eval_wer": 334.6666666666667,
74
  "step": 200
75
  },
76
  {
@@ -99,11 +99,11 @@
99
  },
100
  {
101
  "epoch": 300.0,
102
- "eval_loss": 3.840170383453369,
103
- "eval_runtime": 1.5102,
104
- "eval_samples_per_second": 3.311,
105
- "eval_steps_per_second": 0.662,
106
- "eval_wer": 117.33333333333333,
107
  "step": 300
108
  },
109
  {
@@ -132,11 +132,11 @@
132
  },
133
  {
134
  "epoch": 400.0,
135
- "eval_loss": 3.8931400775909424,
136
- "eval_runtime": 8.4556,
137
- "eval_samples_per_second": 0.591,
138
- "eval_steps_per_second": 0.118,
139
- "eval_wer": 340.0,
140
  "step": 400
141
  },
142
  {
@@ -165,11 +165,11 @@
165
  },
166
  {
167
  "epoch": 500.0,
168
- "eval_loss": 4.06705904006958,
169
- "eval_runtime": 8.4836,
170
- "eval_samples_per_second": 0.589,
171
- "eval_steps_per_second": 0.118,
172
- "eval_wer": 397.3333333333333,
173
  "step": 500
174
  },
175
  {
@@ -198,11 +198,11 @@
198
  },
199
  {
200
  "epoch": 600.0,
201
- "eval_loss": 4.284416675567627,
202
- "eval_runtime": 1.5895,
203
- "eval_samples_per_second": 3.146,
204
- "eval_steps_per_second": 0.629,
205
- "eval_wer": 137.33333333333334,
206
  "step": 600
207
  },
208
  {
@@ -231,11 +231,11 @@
231
  },
232
  {
233
  "epoch": 700.0,
234
- "eval_loss": 4.469689846038818,
235
- "eval_runtime": 4.8142,
236
- "eval_samples_per_second": 1.039,
237
- "eval_steps_per_second": 0.208,
238
- "eval_wer": 289.33333333333337,
239
  "step": 700
240
  },
241
  {
@@ -264,11 +264,11 @@
264
  },
265
  {
266
  "epoch": 800.0,
267
- "eval_loss": 4.627803325653076,
268
- "eval_runtime": 8.4484,
269
- "eval_samples_per_second": 0.592,
270
- "eval_steps_per_second": 0.118,
271
- "eval_wer": 449.3333333333333,
272
  "step": 800
273
  },
274
  {
@@ -297,11 +297,11 @@
297
  },
298
  {
299
  "epoch": 900.0,
300
- "eval_loss": 4.779428005218506,
301
- "eval_runtime": 8.432,
302
- "eval_samples_per_second": 0.593,
303
- "eval_steps_per_second": 0.119,
304
- "eval_wer": 678.6666666666667,
305
  "step": 900
306
  },
307
  {
@@ -330,11 +330,11 @@
330
  },
331
  {
332
  "epoch": 1000.0,
333
- "eval_loss": 4.676939487457275,
334
- "eval_runtime": 8.4726,
335
- "eval_samples_per_second": 0.59,
336
- "eval_steps_per_second": 0.118,
337
- "eval_wer": 261.3333333333333,
338
  "step": 1000
339
  },
340
  {
@@ -363,11 +363,11 @@
363
  },
364
  {
365
  "epoch": 1100.0,
366
- "eval_loss": 5.499487400054932,
367
- "eval_runtime": 8.5264,
368
- "eval_samples_per_second": 0.586,
369
- "eval_steps_per_second": 0.117,
370
- "eval_wer": 100.0,
371
  "step": 1100
372
  },
373
  {
@@ -396,11 +396,11 @@
396
  },
397
  {
398
  "epoch": 1200.0,
399
- "eval_loss": 6.003348350524902,
400
- "eval_runtime": 8.4985,
401
- "eval_samples_per_second": 0.588,
402
- "eval_steps_per_second": 0.118,
403
- "eval_wer": 100.0,
404
  "step": 1200
405
  },
406
  {
@@ -429,11 +429,11 @@
429
  },
430
  {
431
  "epoch": 1300.0,
432
- "eval_loss": 6.288400650024414,
433
- "eval_runtime": 8.612,
434
- "eval_samples_per_second": 0.581,
435
- "eval_steps_per_second": 0.116,
436
- "eval_wer": 100.0,
437
  "step": 1300
438
  },
439
  {
@@ -462,11 +462,11 @@
462
  },
463
  {
464
  "epoch": 1400.0,
465
- "eval_loss": 6.474369049072266,
466
- "eval_runtime": 8.436,
467
- "eval_samples_per_second": 0.593,
468
- "eval_steps_per_second": 0.119,
469
- "eval_wer": 100.0,
470
  "step": 1400
471
  },
472
  {
@@ -495,11 +495,11 @@
495
  },
496
  {
497
  "epoch": 1500.0,
498
- "eval_loss": 6.596408843994141,
499
- "eval_runtime": 8.5317,
500
- "eval_samples_per_second": 0.586,
501
- "eval_steps_per_second": 0.117,
502
- "eval_wer": 100.0,
503
  "step": 1500
504
  },
505
  {
@@ -528,11 +528,11 @@
528
  },
529
  {
530
  "epoch": 1600.0,
531
- "eval_loss": 6.679154872894287,
532
- "eval_runtime": 8.5665,
533
- "eval_samples_per_second": 0.584,
534
- "eval_steps_per_second": 0.117,
535
- "eval_wer": 100.0,
536
  "step": 1600
537
  },
538
  {
@@ -561,11 +561,11 @@
561
  },
562
  {
563
  "epoch": 1700.0,
564
- "eval_loss": 6.7370285987854,
565
- "eval_runtime": 8.4426,
566
- "eval_samples_per_second": 0.592,
567
- "eval_steps_per_second": 0.118,
568
- "eval_wer": 100.0,
569
  "step": 1700
570
  },
571
  {
@@ -594,11 +594,11 @@
594
  },
595
  {
596
  "epoch": 1800.0,
597
- "eval_loss": 6.773484230041504,
598
- "eval_runtime": 8.4858,
599
- "eval_samples_per_second": 0.589,
600
- "eval_steps_per_second": 0.118,
601
- "eval_wer": 100.0,
602
  "step": 1800
603
  },
604
  {
@@ -627,11 +627,11 @@
627
  },
628
  {
629
  "epoch": 1900.0,
630
- "eval_loss": 6.795783042907715,
631
- "eval_runtime": 8.5107,
632
- "eval_samples_per_second": 0.587,
633
- "eval_steps_per_second": 0.117,
634
- "eval_wer": 100.0,
635
  "step": 1900
636
  },
637
  {
@@ -660,11 +660,11 @@
660
  },
661
  {
662
  "epoch": 2000.0,
663
- "eval_loss": 6.801175117492676,
664
- "eval_runtime": 8.5138,
665
- "eval_samples_per_second": 0.587,
666
- "eval_steps_per_second": 0.117,
667
- "eval_wer": 100.0,
668
  "step": 2000
669
  },
670
  {
@@ -672,9 +672,9 @@
672
  "step": 2000,
673
  "total_flos": 5.7717080064e+17,
674
  "train_loss": 0.10164999849759625,
675
- "train_runtime": 1221.0979,
676
- "train_samples_per_second": 104.824,
677
- "train_steps_per_second": 1.638
678
  }
679
  ],
680
  "max_steps": 2000,
 
1
  {
2
+ "best_metric": 103.08219178082192,
3
+ "best_model_checkpoint": "./whisper-small-amet/checkpoint-2000",
4
  "epoch": 2000.0,
5
  "global_step": 2000,
6
  "is_hyper_param_search": false,
 
33
  },
34
  {
35
  "epoch": 100.0,
36
+ "eval_loss": 2.7089741230010986,
37
+ "eval_runtime": 28.1806,
38
+ "eval_samples_per_second": 0.71,
39
+ "eval_steps_per_second": 0.035,
40
+ "eval_wer": 171.57534246575344,
41
  "step": 100
42
  },
43
  {
 
66
  },
67
  {
68
  "epoch": 200.0,
69
+ "eval_loss": 3.7302818298339844,
70
+ "eval_runtime": 28.2207,
71
+ "eval_samples_per_second": 0.709,
72
+ "eval_steps_per_second": 0.035,
73
+ "eval_wer": 298.63013698630135,
74
  "step": 200
75
  },
76
  {
 
99
  },
100
  {
101
  "epoch": 300.0,
102
+ "eval_loss": 3.8286595344543457,
103
+ "eval_runtime": 28.3319,
104
+ "eval_samples_per_second": 0.706,
105
+ "eval_steps_per_second": 0.035,
106
+ "eval_wer": 239.3835616438356,
107
  "step": 300
108
  },
109
  {
 
132
  },
133
  {
134
  "epoch": 400.0,
135
+ "eval_loss": 3.8876891136169434,
136
+ "eval_runtime": 28.3964,
137
+ "eval_samples_per_second": 0.704,
138
+ "eval_steps_per_second": 0.035,
139
+ "eval_wer": 234.93150684931504,
140
  "step": 400
141
  },
142
  {
 
165
  },
166
  {
167
  "epoch": 500.0,
168
+ "eval_loss": 4.056136608123779,
169
+ "eval_runtime": 28.2255,
170
+ "eval_samples_per_second": 0.709,
171
+ "eval_steps_per_second": 0.035,
172
+ "eval_wer": 316.4383561643836,
173
  "step": 500
174
  },
175
  {
 
198
  },
199
  {
200
  "epoch": 600.0,
201
+ "eval_loss": 4.270617485046387,
202
+ "eval_runtime": 28.1771,
203
+ "eval_samples_per_second": 0.71,
204
+ "eval_steps_per_second": 0.035,
205
+ "eval_wer": 189.04109589041096,
206
  "step": 600
207
  },
208
  {
 
231
  },
232
  {
233
  "epoch": 700.0,
234
+ "eval_loss": 4.452445030212402,
235
+ "eval_runtime": 28.3415,
236
+ "eval_samples_per_second": 0.706,
237
+ "eval_steps_per_second": 0.035,
238
+ "eval_wer": 229.45205479452056,
239
  "step": 700
240
  },
241
  {
 
264
  },
265
  {
266
  "epoch": 800.0,
267
+ "eval_loss": 4.625022888183594,
268
+ "eval_runtime": 28.3479,
269
+ "eval_samples_per_second": 0.706,
270
+ "eval_steps_per_second": 0.035,
271
+ "eval_wer": 308.5616438356164,
272
  "step": 800
273
  },
274
  {
 
297
  },
298
  {
299
  "epoch": 900.0,
300
+ "eval_loss": 4.784408092498779,
301
+ "eval_runtime": 28.2633,
302
+ "eval_samples_per_second": 0.708,
303
+ "eval_steps_per_second": 0.035,
304
+ "eval_wer": 429.4520547945205,
305
  "step": 900
306
  },
307
  {
 
330
  },
331
  {
332
  "epoch": 1000.0,
333
+ "eval_loss": 4.618178367614746,
334
+ "eval_runtime": 28.5252,
335
+ "eval_samples_per_second": 0.701,
336
+ "eval_steps_per_second": 0.035,
337
+ "eval_wer": 206.84931506849313,
338
  "step": 1000
339
  },
340
  {
 
363
  },
364
  {
365
  "epoch": 1100.0,
366
+ "eval_loss": 5.542290687561035,
367
+ "eval_runtime": 28.5497,
368
+ "eval_samples_per_second": 0.701,
369
+ "eval_steps_per_second": 0.035,
370
+ "eval_wer": 159.93150684931507,
371
  "step": 1100
372
  },
373
  {
 
396
  },
397
  {
398
  "epoch": 1200.0,
399
+ "eval_loss": 6.0516815185546875,
400
+ "eval_runtime": 28.4295,
401
+ "eval_samples_per_second": 0.703,
402
+ "eval_steps_per_second": 0.035,
403
+ "eval_wer": 151.7123287671233,
404
  "step": 1200
405
  },
406
  {
 
429
  },
430
  {
431
  "epoch": 1300.0,
432
+ "eval_loss": 6.349332332611084,
433
+ "eval_runtime": 28.5448,
434
+ "eval_samples_per_second": 0.701,
435
+ "eval_steps_per_second": 0.035,
436
+ "eval_wer": 154.7945205479452,
437
  "step": 1300
438
  },
439
  {
 
462
  },
463
  {
464
  "epoch": 1400.0,
465
+ "eval_loss": 6.543065547943115,
466
+ "eval_runtime": 28.5232,
467
+ "eval_samples_per_second": 0.701,
468
+ "eval_steps_per_second": 0.035,
469
+ "eval_wer": 138.6986301369863,
470
  "step": 1400
471
  },
472
  {
 
495
  },
496
  {
497
  "epoch": 1500.0,
498
+ "eval_loss": 6.669939994812012,
499
+ "eval_runtime": 28.5345,
500
+ "eval_samples_per_second": 0.701,
501
+ "eval_steps_per_second": 0.035,
502
+ "eval_wer": 158.56164383561645,
503
  "step": 1500
504
  },
505
  {
 
528
  },
529
  {
530
  "epoch": 1600.0,
531
+ "eval_loss": 6.759077548980713,
532
+ "eval_runtime": 28.534,
533
+ "eval_samples_per_second": 0.701,
534
+ "eval_steps_per_second": 0.035,
535
+ "eval_wer": 160.27397260273972,
536
  "step": 1600
537
  },
538
  {
 
561
  },
562
  {
563
  "epoch": 1700.0,
564
+ "eval_loss": 6.82085657119751,
565
+ "eval_runtime": 28.5933,
566
+ "eval_samples_per_second": 0.699,
567
+ "eval_steps_per_second": 0.035,
568
+ "eval_wer": 103.08219178082192,
569
  "step": 1700
570
  },
571
  {
 
594
  },
595
  {
596
  "epoch": 1800.0,
597
+ "eval_loss": 6.856205940246582,
598
+ "eval_runtime": 28.571,
599
+ "eval_samples_per_second": 0.7,
600
+ "eval_steps_per_second": 0.035,
601
+ "eval_wer": 103.08219178082192,
602
  "step": 1800
603
  },
604
  {
 
627
  },
628
  {
629
  "epoch": 1900.0,
630
+ "eval_loss": 6.875776767730713,
631
+ "eval_runtime": 28.4345,
632
+ "eval_samples_per_second": 0.703,
633
+ "eval_steps_per_second": 0.035,
634
+ "eval_wer": 103.08219178082192,
635
  "step": 1900
636
  },
637
  {
 
660
  },
661
  {
662
  "epoch": 2000.0,
663
+ "eval_loss": 6.883942604064941,
664
+ "eval_runtime": 28.4855,
665
+ "eval_samples_per_second": 0.702,
666
+ "eval_steps_per_second": 0.035,
667
+ "eval_wer": 103.08219178082192,
668
  "step": 2000
669
  },
670
  {
 
672
  "step": 2000,
673
  "total_flos": 5.7717080064e+17,
674
  "train_loss": 0.10164999849759625,
675
+ "train_runtime": 954.9086,
676
+ "train_samples_per_second": 134.044,
677
+ "train_steps_per_second": 2.094
678
  }
679
  ],
680
  "max_steps": 2000,