qmeeus commited on
Commit
793067e
1 Parent(s): 0cd6dfd

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 1.19,
3
- "eval_loss": 0.38643914461135864,
4
- "eval_runtime": 204.4048,
5
- "eval_samples": 1000,
6
- "eval_samples_per_second": 4.892,
7
- "eval_steps_per_second": 0.078,
8
- "eval_wer": 18.367063400175983,
9
- "train_loss": 0.4157425765991211,
10
- "train_runtime": 7330.7001,
11
- "train_samples_per_second": 69.843,
12
- "train_steps_per_second": 0.136
13
  }
 
1
  {
2
+ "epoch": 14.04,
3
+ "eval_loss": 0.30335742235183716,
4
+ "eval_runtime": 1122.4749,
5
+ "eval_samples": 5000,
6
+ "eval_samples_per_second": 4.454,
7
+ "eval_steps_per_second": 0.557,
8
+ "eval_wer": 14.535443909153475,
9
+ "train_loss": 0.0768378963470459,
10
+ "train_runtime": 74057.892,
11
+ "train_samples_per_second": 17.284,
12
+ "train_steps_per_second": 0.135
13
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 1.19,
3
- "eval_loss": 0.38643914461135864,
4
- "eval_runtime": 204.4048,
5
- "eval_samples": 1000,
6
- "eval_samples_per_second": 4.892,
7
- "eval_steps_per_second": 0.078,
8
- "eval_wer": 18.367063400175983
9
  }
 
1
  {
2
+ "epoch": 14.04,
3
+ "eval_loss": 0.30335742235183716,
4
+ "eval_runtime": 1122.4749,
5
+ "eval_samples": 5000,
6
+ "eval_samples_per_second": 4.454,
7
+ "eval_steps_per_second": 0.557,
8
+ "eval_wer": 14.535443909153475
9
  }
runs/Dec15_19-32-56_129-146-3-150/events.out.tfevents.1671208059.129-146-3-150.88241.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4348091858c4f36346386139f256e83dac46e73911a6c38b599d7cfdf598df5f
3
+ size 358
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 1.19,
3
- "train_loss": 0.4157425765991211,
4
- "train_runtime": 7330.7001,
5
- "train_samples_per_second": 69.843,
6
- "train_steps_per_second": 0.136
7
  }
 
1
  {
2
+ "epoch": 14.04,
3
+ "train_loss": 0.0768378963470459,
4
+ "train_runtime": 74057.892,
5
+ "train_samples_per_second": 17.284,
6
+ "train_steps_per_second": 0.135
7
  }
trainer_state.json CHANGED
@@ -1,175 +1,235 @@
1
  {
2
- "best_metric": 18.367063400175983,
3
- "best_model_checkpoint": "./whisper-small-nl/checkpoint-600",
4
- "epoch": 1.194,
5
- "global_step": 1000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.1,
12
- "learning_rate": 9.473684210526315e-06,
13
- "loss": 0.8378,
14
- "step": 100
15
  },
16
  {
17
- "epoch": 0.1,
18
- "eval_loss": 0.4932844042778015,
19
- "eval_runtime": 153.0661,
20
- "eval_samples_per_second": 6.533,
21
- "eval_steps_per_second": 0.105,
22
- "eval_wer": 23.882739776779513,
23
- "step": 100
24
  },
25
  {
26
- "epoch": 0.2,
27
- "learning_rate": 8.421052631578948e-06,
28
- "loss": 0.5547,
29
- "step": 200
 
 
 
30
  },
31
  {
32
- "epoch": 0.2,
33
- "eval_loss": 0.44761189818382263,
34
- "eval_runtime": 154.0782,
35
- "eval_samples_per_second": 6.49,
36
- "eval_steps_per_second": 0.104,
37
- "eval_wer": 21.057750196823044,
38
- "step": 200
39
  },
40
  {
41
- "epoch": 0.3,
42
- "learning_rate": 7.368421052631579e-06,
43
- "loss": 0.3905,
44
- "step": 300
45
  },
46
  {
47
- "epoch": 0.3,
48
- "eval_loss": 0.4335392117500305,
49
- "eval_runtime": 152.7461,
50
- "eval_samples_per_second": 6.547,
51
- "eval_steps_per_second": 0.105,
52
- "eval_wer": 21.168897327837723,
53
- "step": 300
54
  },
55
  {
56
- "epoch": 0.4,
57
- "learning_rate": 6.31578947368421e-06,
58
- "loss": 0.3766,
59
- "step": 400
60
  },
61
  {
62
- "epoch": 0.4,
63
- "eval_loss": 0.4266929030418396,
64
- "eval_runtime": 150.336,
65
- "eval_samples_per_second": 6.652,
66
- "eval_steps_per_second": 0.106,
67
- "eval_wer": 20.052794887231972,
68
- "step": 400
69
  },
70
  {
71
- "epoch": 0.5,
72
- "learning_rate": 5.263157894736842e-06,
73
- "loss": 0.4164,
74
- "step": 500
 
 
 
75
  },
76
  {
77
- "epoch": 0.5,
78
- "eval_loss": 0.4138640761375427,
79
- "eval_runtime": 157.7477,
80
- "eval_samples_per_second": 6.339,
81
- "eval_steps_per_second": 0.101,
82
- "eval_wer": 21.43287176399759,
83
- "step": 500
84
  },
85
  {
86
- "epoch": 0.6,
87
- "learning_rate": 4.210526315789474e-06,
88
- "loss": 0.2939,
89
- "step": 600
90
  },
91
  {
92
- "epoch": 0.6,
93
- "eval_loss": 0.38643914461135864,
94
- "eval_runtime": 151.6414,
95
- "eval_samples_per_second": 6.595,
96
- "eval_steps_per_second": 0.106,
97
- "eval_wer": 18.367063400175983,
98
- "step": 600
99
  },
100
  {
101
- "epoch": 0.7,
102
- "learning_rate": 3.157894736842105e-06,
103
- "loss": 0.2632,
104
- "step": 700
105
  },
106
  {
107
- "epoch": 0.7,
108
- "eval_loss": 0.3864086866378784,
109
- "eval_runtime": 152.5897,
110
- "eval_samples_per_second": 6.554,
111
- "eval_steps_per_second": 0.105,
112
- "eval_wer": 18.431899226601214,
113
- "step": 700
114
  },
115
  {
116
- "epoch": 0.8,
117
- "learning_rate": 2.105263157894737e-06,
118
- "loss": 0.6066,
119
- "step": 800
 
 
 
120
  },
121
  {
122
- "epoch": 0.8,
123
- "eval_loss": 0.3804214298725128,
124
- "eval_runtime": 156.1258,
125
- "eval_samples_per_second": 6.405,
126
- "eval_steps_per_second": 0.102,
127
- "eval_wer": 19.27476497012921,
128
- "step": 800
129
  },
130
  {
131
- "epoch": 1.09,
132
- "learning_rate": 1.0526315789473685e-06,
133
- "loss": 0.2075,
134
- "step": 900
135
  },
136
  {
137
- "epoch": 1.09,
138
- "eval_loss": 0.3793680667877197,
139
- "eval_runtime": 153.2522,
140
- "eval_samples_per_second": 6.525,
141
- "eval_steps_per_second": 0.104,
142
- "eval_wer": 18.890381142036773,
143
- "step": 900
144
  },
145
  {
146
- "epoch": 1.19,
147
- "learning_rate": 0.0,
148
- "loss": 0.2102,
149
- "step": 1000
150
  },
151
  {
152
- "epoch": 1.19,
153
- "eval_loss": 0.37768101692199707,
154
- "eval_runtime": 153.5387,
155
- "eval_samples_per_second": 6.513,
156
- "eval_steps_per_second": 0.104,
157
- "eval_wer": 19.88144306025101,
158
- "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
159
  },
160
  {
161
- "epoch": 1.19,
162
- "step": 1000,
163
- "total_flos": 1.84579222044672e+19,
164
- "train_loss": 0.4157425765991211,
165
- "train_runtime": 7330.7001,
166
- "train_samples_per_second": 69.843,
167
- "train_steps_per_second": 0.136
168
  }
169
  ],
170
- "max_steps": 1000,
171
  "num_train_epochs": 9223372036854775807,
172
- "total_flos": 1.84579222044672e+19,
173
  "trial_name": null,
174
  "trial_params": null
175
  }
 
1
  {
2
+ "best_metric": 14.535443909153475,
3
+ "best_model_checkpoint": "whisper-small-nl/checkpoint-10000",
4
+ "epoch": 14.0372,
5
+ "global_step": 10000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 1.24,
12
+ "learning_rate": 9.980000000000001e-06,
13
+ "loss": 0.7181,
14
+ "step": 500
15
  },
16
  {
17
+ "epoch": 2.49,
18
+ "learning_rate": 8.891111111111111e-06,
19
+ "loss": 0.2045,
20
+ "step": 1000
 
 
 
21
  },
22
  {
23
+ "epoch": 2.49,
24
+ "eval_loss": 0.31939101219177246,
25
+ "eval_runtime": 852.4844,
26
+ "eval_samples_per_second": 5.865,
27
+ "eval_steps_per_second": 0.733,
28
+ "eval_wer": 16.16284610090529,
29
+ "step": 1000
30
  },
31
  {
32
+ "epoch": 3.73,
33
+ "learning_rate": 7.78e-06,
34
+ "loss": 0.1182,
35
+ "step": 1500
 
 
 
36
  },
37
  {
38
+ "epoch": 4.97,
39
+ "learning_rate": 6.668888888888889e-06,
40
+ "loss": 0.0652,
41
+ "step": 2000
42
  },
43
  {
44
+ "epoch": 4.97,
45
+ "eval_loss": 0.3425401449203491,
46
+ "eval_runtime": 853.9079,
47
+ "eval_samples_per_second": 5.855,
48
+ "eval_steps_per_second": 0.732,
49
+ "eval_wer": 16.367197840012707,
50
+ "step": 2000
51
  },
52
  {
53
+ "epoch": 6.22,
54
+ "learning_rate": 5.557777777777778e-06,
55
+ "loss": 0.0318,
56
+ "step": 2500
57
  },
58
  {
59
+ "epoch": 7.46,
60
+ "learning_rate": 4.446666666666667e-06,
61
+ "loss": 0.0167,
62
+ "step": 3000
 
 
 
63
  },
64
  {
65
+ "epoch": 7.46,
66
+ "eval_loss": 0.3914715647697449,
67
+ "eval_runtime": 851.1992,
68
+ "eval_samples_per_second": 5.874,
69
+ "eval_steps_per_second": 0.734,
70
+ "eval_wer": 15.818730478056011,
71
+ "step": 3000
72
  },
73
  {
74
+ "epoch": 8.71,
75
+ "learning_rate": 3.335555555555556e-06,
76
+ "loss": 0.0096,
77
+ "step": 3500
 
 
 
78
  },
79
  {
80
+ "epoch": 9.95,
81
+ "learning_rate": 2.2244444444444447e-06,
82
+ "loss": 0.0064,
83
+ "step": 4000
84
  },
85
  {
86
+ "epoch": 9.95,
87
+ "eval_loss": 0.41895967721939087,
88
+ "eval_runtime": 850.8744,
89
+ "eval_samples_per_second": 5.876,
90
+ "eval_steps_per_second": 0.735,
91
+ "eval_wer": 15.729789824765735,
92
+ "step": 4000
93
  },
94
  {
95
+ "epoch": 1.01,
96
+ "learning_rate": 5.790526315789474e-06,
97
+ "loss": 0.1798,
98
+ "step": 4500
99
  },
100
  {
101
+ "epoch": 2.02,
102
+ "learning_rate": 5.26421052631579e-06,
103
+ "loss": 0.1966,
104
+ "step": 5000
 
 
 
105
  },
106
  {
107
+ "epoch": 2.02,
108
+ "eval_loss": 0.32975926995277405,
109
+ "eval_runtime": 1015.8008,
110
+ "eval_samples_per_second": 4.922,
111
+ "eval_steps_per_second": 0.615,
112
+ "eval_wer": 15.088146540314467,
113
+ "step": 5000
114
  },
115
  {
116
+ "epoch": 3.03,
117
+ "learning_rate": 4.737894736842106e-06,
118
+ "loss": 0.1605,
119
+ "step": 5500
 
 
 
120
  },
121
  {
122
+ "epoch": 4.04,
123
+ "learning_rate": 4.211578947368422e-06,
124
+ "loss": 0.1912,
125
+ "step": 6000
126
  },
127
  {
128
+ "epoch": 4.04,
129
+ "eval_loss": 0.3265514671802521,
130
+ "eval_runtime": 1016.6509,
131
+ "eval_samples_per_second": 4.918,
132
+ "eval_steps_per_second": 0.615,
133
+ "eval_wer": 14.876383080099528,
134
+ "step": 6000
135
  },
136
  {
137
+ "epoch": 6.01,
138
+ "learning_rate": 3.685263157894737e-06,
139
+ "loss": 0.1355,
140
+ "step": 6500
141
  },
142
  {
143
+ "epoch": 7.02,
144
+ "learning_rate": 3.1600000000000002e-06,
145
+ "loss": 0.1008,
146
+ "step": 7000
147
+ },
148
+ {
149
+ "epoch": 7.02,
150
+ "eval_loss": 0.3261025547981262,
151
+ "eval_runtime": 1005.7569,
152
+ "eval_samples_per_second": 4.971,
153
+ "eval_steps_per_second": 0.621,
154
+ "eval_wer": 14.808618772830748,
155
+ "step": 7000
156
+ },
157
+ {
158
+ "epoch": 8.03,
159
+ "learning_rate": 2.633684210526316e-06,
160
+ "loss": 0.1092,
161
+ "step": 7500
162
+ },
163
+ {
164
+ "epoch": 9.04,
165
+ "learning_rate": 2.1073684210526317e-06,
166
+ "loss": 0.0899,
167
+ "step": 8000
168
+ },
169
+ {
170
+ "epoch": 9.04,
171
+ "eval_loss": 0.31958696246147156,
172
+ "eval_runtime": 1016.386,
173
+ "eval_samples_per_second": 4.919,
174
+ "eval_steps_per_second": 0.615,
175
+ "eval_wer": 14.648737360368468,
176
+ "step": 8000
177
+ },
178
+ {
179
+ "epoch": 11.01,
180
+ "learning_rate": 1.5810526315789477e-06,
181
+ "loss": 0.0683,
182
+ "step": 8500
183
+ },
184
+ {
185
+ "epoch": 12.02,
186
+ "learning_rate": 1.0547368421052632e-06,
187
+ "loss": 0.1126,
188
+ "step": 9000
189
+ },
190
+ {
191
+ "epoch": 12.02,
192
+ "eval_loss": 0.3282873332500458,
193
+ "eval_runtime": 1020.4433,
194
+ "eval_samples_per_second": 4.9,
195
+ "eval_steps_per_second": 0.612,
196
+ "eval_wer": 14.589443591508285,
197
+ "step": 9000
198
+ },
199
+ {
200
+ "epoch": 13.03,
201
+ "learning_rate": 5.284210526315789e-07,
202
+ "loss": 0.0853,
203
+ "step": 9500
204
+ },
205
+ {
206
+ "epoch": 14.04,
207
+ "learning_rate": 2.105263157894737e-09,
208
+ "loss": 0.1071,
209
+ "step": 10000
210
+ },
211
+ {
212
+ "epoch": 14.04,
213
+ "eval_loss": 0.30335742235183716,
214
+ "eval_runtime": 1026.6502,
215
+ "eval_samples_per_second": 4.87,
216
+ "eval_steps_per_second": 0.609,
217
+ "eval_wer": 14.535443909153475,
218
+ "step": 10000
219
  },
220
  {
221
+ "epoch": 14.04,
222
+ "step": 10000,
223
+ "total_flos": 3.699734092598477e+20,
224
+ "train_loss": 0.0768378963470459,
225
+ "train_runtime": 74057.892,
226
+ "train_samples_per_second": 17.284,
227
+ "train_steps_per_second": 0.135
228
  }
229
  ],
230
+ "max_steps": 10000,
231
  "num_train_epochs": 9223372036854775807,
232
+ "total_flos": 3.699734092598477e+20,
233
  "trial_name": null,
234
  "trial_params": null
235
  }