ihanif committed on
Commit
6f674a1
1 Parent(s): 4ede9f9

End of training

Browse files
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ .run_speech_recognition_seq2seq_streaming.py.swp filter=lfs diff=lfs merge=lfs -text
.run_speech_recognition_seq2seq_streaming.py.swp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5afad038ca66e4a3fe2adc83255d2b1830295ec385663ae7117e72f55f25982a
3
+ size 20480
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 18.52,
3
- "eval_loss": 1.1797882318496704,
4
- "eval_runtime": 450.6771,
5
- "eval_samples_per_second": 1.136,
6
  "eval_steps_per_second": 0.142,
7
- "eval_wer": 57.87681598062954,
8
- "train_loss": 0.0056979965269565586,
9
- "train_runtime": 579.6036,
10
- "train_samples_per_second": 13.803,
11
- "train_steps_per_second": 0.863
12
  }
 
1
  {
2
+ "epoch": 22.22,
3
+ "eval_loss": 1.2309296131134033,
4
+ "eval_runtime": 450.2608,
5
+ "eval_samples_per_second": 1.137,
6
  "eval_steps_per_second": 0.142,
7
+ "eval_wer": 56.651029055690074,
8
+ "train_loss": 0.001749273296445608,
9
+ "train_runtime": 576.5843,
10
+ "train_samples_per_second": 16.65,
11
+ "train_steps_per_second": 1.041
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 18.52,
3
- "eval_loss": 1.1797882318496704,
4
- "eval_runtime": 450.6771,
5
- "eval_samples_per_second": 1.136,
6
  "eval_steps_per_second": 0.142,
7
- "eval_wer": 57.87681598062954
8
  }
 
1
  {
2
+ "epoch": 22.22,
3
+ "eval_loss": 1.2309296131134033,
4
+ "eval_runtime": 450.2608,
5
+ "eval_samples_per_second": 1.137,
6
  "eval_steps_per_second": 0.142,
7
+ "eval_wer": 56.651029055690074
8
  }
runs/Dec16_18-03-10_129-146-104-29/events.out.tfevents.1671214896.129-146-104-29.137983.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ba67a7b84b79d789629e06628df81253985de536e93a6637efe8768b88cf00d
3
+ size 358
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 18.52,
3
- "train_loss": 0.0056979965269565586,
4
- "train_runtime": 579.6036,
5
- "train_samples_per_second": 13.803,
6
- "train_steps_per_second": 0.863
7
  }
 
1
  {
2
+ "epoch": 22.22,
3
+ "train_loss": 0.001749273296445608,
4
+ "train_runtime": 576.5843,
5
+ "train_samples_per_second": 16.65,
6
+ "train_steps_per_second": 1.041
7
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 57.87681598062954,
3
- "best_model_checkpoint": "./checkpoint-500",
4
- "epoch": 18.51851851851852,
5
- "global_step": 500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -245,18 +245,87 @@
245
  "step": 500
246
  },
247
  {
248
- "epoch": 18.52,
249
- "step": 500,
250
- "total_flos": 2.30348866535424e+18,
251
- "train_loss": 0.0056979965269565586,
252
- "train_runtime": 579.6036,
253
- "train_samples_per_second": 13.803,
254
- "train_steps_per_second": 0.863
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
255
  }
256
  ],
257
- "max_steps": 500,
258
- "num_train_epochs": 19,
259
- "total_flos": 2.30348866535424e+18,
260
  "trial_name": null,
261
  "trial_params": null
262
  }
 
1
  {
2
+ "best_metric": 56.651029055690074,
3
+ "best_model_checkpoint": "./checkpoint-600",
4
+ "epoch": 22.22222222222222,
5
+ "global_step": 600,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
245
  "step": 500
246
  },
247
  {
248
+ "epoch": 18.89,
249
+ "learning_rate": 9.4e-06,
250
+ "loss": 0.019,
251
+ "step": 510
252
+ },
253
+ {
254
+ "epoch": 19.26,
255
+ "learning_rate": 8.400000000000001e-06,
256
+ "loss": 0.021,
257
+ "step": 520
258
+ },
259
+ {
260
+ "epoch": 19.63,
261
+ "learning_rate": 7.4e-06,
262
+ "loss": 0.0139,
263
+ "step": 530
264
+ },
265
+ {
266
+ "epoch": 20.0,
267
+ "learning_rate": 6.4000000000000006e-06,
268
+ "loss": 0.013,
269
+ "step": 540
270
+ },
271
+ {
272
+ "epoch": 20.37,
273
+ "learning_rate": 5.400000000000001e-06,
274
+ "loss": 0.007,
275
+ "step": 550
276
+ },
277
+ {
278
+ "epoch": 20.74,
279
+ "learning_rate": 4.4e-06,
280
+ "loss": 0.0082,
281
+ "step": 560
282
+ },
283
+ {
284
+ "epoch": 21.11,
285
+ "learning_rate": 3.4000000000000005e-06,
286
+ "loss": 0.009,
287
+ "step": 570
288
+ },
289
+ {
290
+ "epoch": 21.48,
291
+ "learning_rate": 2.4000000000000003e-06,
292
+ "loss": 0.0045,
293
+ "step": 580
294
+ },
295
+ {
296
+ "epoch": 21.85,
297
+ "learning_rate": 1.4000000000000001e-06,
298
+ "loss": 0.0049,
299
+ "step": 590
300
+ },
301
+ {
302
+ "epoch": 22.22,
303
+ "learning_rate": 4.0000000000000003e-07,
304
+ "loss": 0.0045,
305
+ "step": 600
306
+ },
307
+ {
308
+ "epoch": 22.22,
309
+ "eval_loss": 1.2309296131134033,
310
+ "eval_runtime": 449.2432,
311
+ "eval_samples_per_second": 1.14,
312
+ "eval_steps_per_second": 0.142,
313
+ "eval_wer": 56.651029055690074,
314
+ "step": 600
315
+ },
316
+ {
317
+ "epoch": 22.22,
318
+ "step": 600,
319
+ "total_flos": 2.76407096426496e+18,
320
+ "train_loss": 0.001749273296445608,
321
+ "train_runtime": 576.5843,
322
+ "train_samples_per_second": 16.65,
323
+ "train_steps_per_second": 1.041
324
  }
325
  ],
326
+ "max_steps": 600,
327
+ "num_train_epochs": 23,
328
+ "total_flos": 2.76407096426496e+18,
329
  "trial_name": null,
330
  "trial_params": null
331
  }