DewiBrynJones committed on
Commit
3077817
1 Parent(s): 411e103

End of training

Browse files
README.md CHANGED
@@ -2,6 +2,8 @@
2
  license: apache-2.0
3
  base_model: facebook/wav2vec2-large-xlsr-53
4
  tags:
 
 
5
  - generated_from_trainer
6
  metrics:
7
  - wer
@@ -15,7 +17,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # wav2vec2-xlsr-53-ft-btb-ccv-cy
17
 
18
- This model is a fine-tuned version of [facebook/wav2vec2-large-xlsr-53](https://huggingface.co/facebook/wav2vec2-large-xlsr-53) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
  - Loss: 0.5865
21
  - Wer: 0.4452
 
2
  license: apache-2.0
3
  base_model: facebook/wav2vec2-large-xlsr-53
4
  tags:
5
+ - automatic-speech-recognition
6
+ - DewiBrynJones/banc-trawsgrifiadau-bangor-clean-with-ccv
7
  - generated_from_trainer
8
  metrics:
9
  - wer
 
17
 
18
  # wav2vec2-xlsr-53-ft-btb-ccv-cy
19
 
20
+ This model is a fine-tuned version of [facebook/wav2vec2-large-xlsr-53](https://huggingface.co/facebook/wav2vec2-large-xlsr-53) on the DEWIBRYNJONES/BANC-TRAWSGRIFIADAU-BANGOR-CLEAN-WITH-CCV - DEFAULT dataset.
21
  It achieves the following results on the evaluation set:
22
  - Loss: 0.5865
23
  - Wer: 0.4452
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
- "epoch": 1.008233910267182,
3
- "eval_loss": 0.5155353546142578,
4
- "eval_runtime": 186.6856,
5
  "eval_samples": 7022,
6
- "eval_samples_per_second": 37.614,
7
- "eval_steps_per_second": 2.352,
8
- "eval_wer": 0.39834438406037814,
9
- "total_flos": 6.665403914161851e+18,
10
- "train_loss": 1.086754165649414,
11
- "train_runtime": 4718.794,
12
- "train_samples": 47607,
13
- "train_samples_per_second": 10.172,
14
- "train_steps_per_second": 1.272
15
  }
 
1
  {
2
+ "epoch": 0.38476337052712584,
3
+ "eval_loss": 0.5865370631217957,
4
+ "eval_runtime": 179.3337,
5
  "eval_samples": 7022,
6
+ "eval_samples_per_second": 39.156,
7
+ "eval_steps_per_second": 2.448,
8
+ "eval_wer": 0.44523578575319894,
9
+ "total_flos": 6.835515215409967e+18,
10
+ "train_loss": 0.9274428431193034,
11
+ "train_runtime": 4544.4955,
12
+ "train_samples": 124748,
13
+ "train_samples_per_second": 10.562,
14
+ "train_steps_per_second": 1.32
15
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 1.008233910267182,
3
- "eval_loss": 0.5155353546142578,
4
- "eval_runtime": 186.6856,
5
  "eval_samples": 7022,
6
- "eval_samples_per_second": 37.614,
7
- "eval_steps_per_second": 2.352,
8
- "eval_wer": 0.39834438406037814
9
  }
 
1
  {
2
+ "epoch": 0.38476337052712584,
3
+ "eval_loss": 0.5865370631217957,
4
+ "eval_runtime": 179.3337,
5
  "eval_samples": 7022,
6
+ "eval_samples_per_second": 39.156,
7
+ "eval_steps_per_second": 2.448,
8
+ "eval_wer": 0.44523578575319894
9
  }
runs/Aug30_15-47-58_4b35055fdbcb/events.out.tfevents.1725037630.4b35055fdbcb.30.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2b50ba638d1137f7ceced29f612cfc608a9c7ade1ffa24786817e12c05671ce
3
+ size 406
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 1.008233910267182,
3
- "total_flos": 6.665403914161851e+18,
4
- "train_loss": 1.086754165649414,
5
- "train_runtime": 4718.794,
6
- "train_samples": 47607,
7
- "train_samples_per_second": 10.172,
8
- "train_steps_per_second": 1.272
9
  }
 
1
  {
2
+ "epoch": 0.38476337052712584,
3
+ "total_flos": 6.835515215409967e+18,
4
+ "train_loss": 0.9274428431193034,
5
+ "train_runtime": 4544.4955,
6
+ "train_samples": 124748,
7
+ "train_samples_per_second": 10.562,
8
+ "train_steps_per_second": 1.32
9
  }
trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.008233910267182,
5
  "eval_steps": 500,
6
  "global_step": 6000,
7
  "is_hyper_param_search": false,
@@ -9,211 +9,211 @@
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.08401949252226516,
13
- "grad_norm": 19.443201065063477,
14
- "learning_rate": 0.0002455,
15
- "loss": 4.6277,
16
  "step": 500
17
  },
18
  {
19
- "epoch": 0.08401949252226516,
20
- "eval_loss": 1.7780689001083374,
21
- "eval_runtime": 184.9372,
22
- "eval_samples_per_second": 37.97,
23
- "eval_steps_per_second": 2.374,
24
- "eval_wer": 0.9507301452317996,
25
  "step": 500
26
  },
27
  {
28
- "epoch": 0.16803898504453033,
29
- "grad_norm": 10.621150970458984,
30
- "learning_rate": 0.0002782777777777778,
31
- "loss": 1.2514,
32
  "step": 1000
33
  },
34
  {
35
- "epoch": 0.16803898504453033,
36
- "eval_loss": 1.046749472618103,
37
- "eval_runtime": 183.9043,
38
- "eval_samples_per_second": 38.183,
39
- "eval_steps_per_second": 2.387,
40
- "eval_wer": 0.7116623925377695,
41
  "step": 1000
42
  },
43
  {
44
- "epoch": 0.2520584775667955,
45
- "grad_norm": 6.651599884033203,
46
- "learning_rate": 0.00025049999999999996,
47
- "loss": 0.986,
48
  "step": 1500
49
  },
50
  {
51
- "epoch": 0.2520584775667955,
52
- "eval_loss": 0.8940034508705139,
53
- "eval_runtime": 185.3076,
54
- "eval_samples_per_second": 37.894,
55
- "eval_steps_per_second": 2.369,
56
- "eval_wer": 0.6577817935396431,
57
  "step": 1500
58
  },
59
  {
60
- "epoch": 0.33607797008906065,
61
- "grad_norm": 16.908123016357422,
62
- "learning_rate": 0.00022277777777777774,
63
- "loss": 0.8702,
64
  "step": 2000
65
  },
66
  {
67
- "epoch": 0.33607797008906065,
68
- "eval_loss": 0.8157631158828735,
69
- "eval_runtime": 185.5186,
70
- "eval_samples_per_second": 37.851,
71
- "eval_steps_per_second": 2.366,
72
- "eval_wer": 0.5836644122297665,
73
  "step": 2000
74
  },
75
  {
76
- "epoch": 0.4200974626113258,
77
- "grad_norm": 10.515896797180176,
78
- "learning_rate": 0.00019505555555555555,
79
- "loss": 0.8063,
80
  "step": 2500
81
  },
82
  {
83
- "epoch": 0.4200974626113258,
84
- "eval_loss": 0.7131509184837341,
85
- "eval_runtime": 185.8391,
86
- "eval_samples_per_second": 37.785,
87
- "eval_steps_per_second": 2.362,
88
- "eval_wer": 0.5281095948657304,
89
  "step": 2500
90
  },
91
  {
92
- "epoch": 0.504116955133591,
93
- "grad_norm": 3.7379024028778076,
94
- "learning_rate": 0.00016727777777777778,
95
- "loss": 0.7518,
96
  "step": 3000
97
  },
98
  {
99
- "epoch": 0.504116955133591,
100
- "eval_loss": 0.7195897102355957,
101
- "eval_runtime": 183.5821,
102
- "eval_samples_per_second": 38.25,
103
- "eval_steps_per_second": 2.391,
104
- "eval_wer": 0.5187950942744389,
105
  "step": 3000
106
  },
107
  {
108
- "epoch": 0.5881364476558562,
109
- "grad_norm": 5.922393321990967,
110
- "learning_rate": 0.0001395,
111
- "loss": 0.7045,
112
  "step": 3500
113
  },
114
  {
115
- "epoch": 0.5881364476558562,
116
- "eval_loss": 0.6231045722961426,
117
- "eval_runtime": 184.2635,
118
- "eval_samples_per_second": 38.108,
119
- "eval_steps_per_second": 2.382,
120
- "eval_wer": 0.4771256593895747,
121
  "step": 3500
122
  },
123
  {
124
- "epoch": 0.6721559401781213,
125
- "grad_norm": 8.91370964050293,
126
- "learning_rate": 0.00011177777777777777,
127
- "loss": 0.6726,
128
  "step": 4000
129
  },
130
  {
131
- "epoch": 0.6721559401781213,
132
- "eval_loss": 0.6074743270874023,
133
- "eval_runtime": 184.3908,
134
- "eval_samples_per_second": 38.082,
135
- "eval_steps_per_second": 2.381,
136
- "eval_wer": 0.4517333475066105,
137
  "step": 4000
138
  },
139
  {
140
- "epoch": 0.7561754327003865,
141
- "grad_norm": 12.337292671203613,
142
- "learning_rate": 8.405555555555556e-05,
143
- "loss": 0.6355,
144
  "step": 4500
145
  },
146
  {
147
- "epoch": 0.7561754327003865,
148
- "eval_loss": 0.5601897239685059,
149
- "eval_runtime": 184.3021,
150
- "eval_samples_per_second": 38.1,
151
- "eval_steps_per_second": 2.382,
152
- "eval_wer": 0.4328784597191034,
153
  "step": 4500
154
  },
155
  {
156
- "epoch": 0.8401949252226516,
157
- "grad_norm": 18.518247604370117,
158
- "learning_rate": 5.6333333333333325e-05,
159
- "loss": 0.5938,
160
  "step": 5000
161
  },
162
  {
163
- "epoch": 0.8401949252226516,
164
- "eval_loss": 0.5438016653060913,
165
- "eval_runtime": 185.1047,
166
- "eval_samples_per_second": 37.935,
167
- "eval_steps_per_second": 2.372,
168
- "eval_wer": 0.4225939754713722,
169
  "step": 5000
170
  },
171
  {
172
- "epoch": 0.9242144177449169,
173
- "grad_norm": 5.622241020202637,
174
- "learning_rate": 2.8555555555555556e-05,
175
- "loss": 0.5842,
176
  "step": 5500
177
  },
178
  {
179
- "epoch": 0.9242144177449169,
180
- "eval_loss": 0.5245193839073181,
181
- "eval_runtime": 184.9427,
182
- "eval_samples_per_second": 37.969,
183
- "eval_steps_per_second": 2.374,
184
- "eval_wer": 0.4090939289653065,
185
  "step": 5500
186
  },
187
  {
188
- "epoch": 1.008233910267182,
189
- "grad_norm": 10.519143104553223,
190
- "learning_rate": 7.777777777777777e-07,
191
- "loss": 0.557,
192
  "step": 6000
193
  },
194
  {
195
- "epoch": 1.008233910267182,
196
- "eval_loss": 0.5155353546142578,
197
- "eval_runtime": 185.543,
198
- "eval_samples_per_second": 37.846,
199
- "eval_steps_per_second": 2.366,
200
- "eval_wer": 0.39834438406037814,
201
  "step": 6000
202
  },
203
  {
204
- "epoch": 1.008233910267182,
205
  "step": 6000,
206
- "total_flos": 6.665403914161851e+18,
207
- "train_loss": 1.086754165649414,
208
- "train_runtime": 4718.794,
209
- "train_samples_per_second": 10.172,
210
- "train_steps_per_second": 1.272
211
  }
212
  ],
213
  "logging_steps": 500,
214
  "max_steps": 6000,
215
  "num_input_tokens_seen": 0,
216
- "num_train_epochs": 2,
217
  "save_steps": 500,
218
  "stateful_callbacks": {
219
  "TrainerControl": {
@@ -227,7 +227,7 @@
227
  "attributes": {}
228
  }
229
  },
230
- "total_flos": 6.665403914161851e+18,
231
  "train_batch_size": 8,
232
  "trial_name": null,
233
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.38476337052712584,
5
  "eval_steps": 500,
6
  "global_step": 6000,
7
  "is_hyper_param_search": false,
 
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.03206361421059382,
13
+ "grad_norm": 10.316516876220703,
14
+ "learning_rate": 0.0002465,
15
+ "loss": 4.7051,
16
  "step": 500
17
  },
18
  {
19
+ "epoch": 0.03206361421059382,
20
+ "eval_loss": 1.6561740636825562,
21
+ "eval_runtime": 191.0416,
22
+ "eval_samples_per_second": 36.756,
23
+ "eval_steps_per_second": 2.298,
24
+ "eval_wer": 0.9354894431230816,
25
  "step": 500
26
  },
27
  {
28
+ "epoch": 0.06412722842118763,
29
+ "grad_norm": 4.912766933441162,
30
+ "learning_rate": 0.00027816666666666663,
31
+ "loss": 1.0362,
32
  "step": 1000
33
  },
34
  {
35
+ "epoch": 0.06412722842118763,
36
+ "eval_loss": 1.1839842796325684,
37
+ "eval_runtime": 175.5788,
38
+ "eval_samples_per_second": 39.993,
39
+ "eval_steps_per_second": 2.5,
40
+ "eval_wer": 0.7977517639086356,
41
  "step": 1000
42
  },
43
  {
44
+ "epoch": 0.09619084263178146,
45
+ "grad_norm": 4.178534030914307,
46
+ "learning_rate": 0.00025038888888888886,
47
+ "loss": 0.811,
48
  "step": 1500
49
  },
50
  {
51
+ "epoch": 0.09619084263178146,
52
+ "eval_loss": 1.0081175565719604,
53
+ "eval_runtime": 175.5534,
54
+ "eval_samples_per_second": 39.999,
55
+ "eval_steps_per_second": 2.501,
56
+ "eval_wer": 0.7174690070290597,
57
  "step": 1500
58
  },
59
  {
60
+ "epoch": 0.12825445684237527,
61
+ "grad_norm": 7.957609176635742,
62
+ "learning_rate": 0.0002226111111111111,
63
+ "loss": 0.6903,
64
  "step": 2000
65
  },
66
  {
67
+ "epoch": 0.12825445684237527,
68
+ "eval_loss": 0.8935067057609558,
69
+ "eval_runtime": 176.1028,
70
+ "eval_samples_per_second": 39.874,
71
+ "eval_steps_per_second": 2.493,
72
+ "eval_wer": 0.6401094885661516,
73
  "step": 2000
74
  },
75
  {
76
+ "epoch": 0.16031807105296908,
77
+ "grad_norm": 6.541042327880859,
78
+ "learning_rate": 0.00019483333333333332,
79
+ "loss": 0.6238,
80
  "step": 2500
81
  },
82
  {
83
+ "epoch": 0.16031807105296908,
84
+ "eval_loss": 0.8059775233268738,
85
+ "eval_runtime": 177.0587,
86
+ "eval_samples_per_second": 39.659,
87
+ "eval_steps_per_second": 2.479,
88
+ "eval_wer": 0.5848868573858276,
89
  "step": 2500
90
  },
91
  {
92
+ "epoch": 0.19238168526356292,
93
+ "grad_norm": 5.036514759063721,
94
+ "learning_rate": 0.00016705555555555554,
95
+ "loss": 0.5649,
96
  "step": 3000
97
  },
98
  {
99
+ "epoch": 0.19238168526356292,
100
+ "eval_loss": 0.7770201563835144,
101
+ "eval_runtime": 178.1454,
102
+ "eval_samples_per_second": 39.417,
103
+ "eval_steps_per_second": 2.464,
104
+ "eval_wer": 0.5589231852668783,
105
  "step": 3000
106
  },
107
  {
108
+ "epoch": 0.22444529947415673,
109
+ "grad_norm": 4.140881538391113,
110
+ "learning_rate": 0.00013927777777777777,
111
+ "loss": 0.5309,
112
  "step": 3500
113
  },
114
  {
115
+ "epoch": 0.22444529947415673,
116
+ "eval_loss": 0.7264481782913208,
117
+ "eval_runtime": 176.7301,
118
+ "eval_samples_per_second": 39.733,
119
+ "eval_steps_per_second": 2.484,
120
+ "eval_wer": 0.5326539018589139,
121
  "step": 3500
122
  },
123
  {
124
+ "epoch": 0.25650891368475054,
125
+ "grad_norm": 6.205782413482666,
126
+ "learning_rate": 0.00011155555555555555,
127
+ "loss": 0.4892,
128
  "step": 4000
129
  },
130
  {
131
+ "epoch": 0.25650891368475054,
132
+ "eval_loss": 0.6865007877349854,
133
+ "eval_runtime": 178.7785,
134
+ "eval_samples_per_second": 39.278,
135
+ "eval_steps_per_second": 2.456,
136
+ "eval_wer": 0.5106366016024662,
137
  "step": 4000
138
  },
139
  {
140
+ "epoch": 0.2885725278953444,
141
+ "grad_norm": 9.618443489074707,
142
+ "learning_rate": 8.388888888888888e-05,
143
+ "loss": 0.4521,
144
  "step": 4500
145
  },
146
  {
147
+ "epoch": 0.2885725278953444,
148
+ "eval_loss": 0.6477864980697632,
149
+ "eval_runtime": 177.7072,
150
+ "eval_samples_per_second": 39.514,
151
+ "eval_steps_per_second": 2.47,
152
+ "eval_wer": 0.4861345486918508,
153
  "step": 4500
154
  },
155
  {
156
+ "epoch": 0.32063614210593816,
157
+ "grad_norm": 8.743291854858398,
158
+ "learning_rate": 5.61111111111111e-05,
159
+ "loss": 0.4309,
160
  "step": 5000
161
  },
162
  {
163
+ "epoch": 0.32063614210593816,
164
+ "eval_loss": 0.6221807599067688,
165
+ "eval_runtime": 177.9115,
166
+ "eval_samples_per_second": 39.469,
167
+ "eval_steps_per_second": 2.468,
168
+ "eval_wer": 0.4763416999960138,
169
  "step": 5000
170
  },
171
  {
172
+ "epoch": 0.352699756316532,
173
+ "grad_norm": 8.870036125183105,
174
+ "learning_rate": 2.833333333333333e-05,
175
+ "loss": 0.4055,
176
  "step": 5500
177
  },
178
  {
179
+ "epoch": 0.352699756316532,
180
+ "eval_loss": 0.5988152027130127,
181
+ "eval_runtime": 178.6515,
182
+ "eval_samples_per_second": 39.306,
183
+ "eval_steps_per_second": 2.457,
184
+ "eval_wer": 0.45257045668956536,
185
  "step": 5500
186
  },
187
  {
188
+ "epoch": 0.38476337052712584,
189
+ "grad_norm": 14.018965721130371,
190
+ "learning_rate": 6.11111111111111e-07,
191
+ "loss": 0.3896,
192
  "step": 6000
193
  },
194
  {
195
+ "epoch": 0.38476337052712584,
196
+ "eval_loss": 0.5865370631217957,
197
+ "eval_runtime": 176.8507,
198
+ "eval_samples_per_second": 39.706,
199
+ "eval_steps_per_second": 2.482,
200
+ "eval_wer": 0.44523578575319894,
201
  "step": 6000
202
  },
203
  {
204
+ "epoch": 0.38476337052712584,
205
  "step": 6000,
206
+ "total_flos": 6.835515215409967e+18,
207
+ "train_loss": 0.9274428431193034,
208
+ "train_runtime": 4544.4955,
209
+ "train_samples_per_second": 10.562,
210
+ "train_steps_per_second": 1.32
211
  }
212
  ],
213
  "logging_steps": 500,
214
  "max_steps": 6000,
215
  "num_input_tokens_seen": 0,
216
+ "num_train_epochs": 1,
217
  "save_steps": 500,
218
  "stateful_callbacks": {
219
  "TrainerControl": {
 
227
  "attributes": {}
228
  }
229
  },
230
+ "total_flos": 6.835515215409967e+18,
231
  "train_batch_size": 8,
232
  "trial_name": null,
233
  "trial_params": null