mprzibilla committed on
Commit
b02d155
1 Parent(s): 36fd286

Training in progress, epoch 15

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8784c6ab43edf317cbf72cd41edf62484b74352d6d7d83acc2f051f7a65008b2
3
  size 721661957
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01d608eb5c5bb1e5a04194d9459fad8efe4105639d7ec60f4793e908bee01ded
3
  size 721661957
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe139ad8af6b60c1a91b2eaa1256fad6cc9d9968a1f8dc94872c4fb95570f04c
3
  size 377646433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2820bc90593d7e6a12e93895fccf5a57a04083cda0f9618714291c06c24172f6
3
  size 377646433
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77449eee0e37c3a473773336c4dbcfe7c14eecc740f7fbaa6436e6669f2d6fbd
3
  size 14639
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a906ecbc561abf50620a59de5a6f7c9069c6d34071327af28d703780de77d2c
3
  size 14639
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4cbcf41191e28d7739e96f26098069b589cab9c332419d792a7590cdd6570afd
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a123fd4a1fb530b6f54c935524d6597bb50eaf008fb8e8a85e8a0213174b1e68
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d68fe7515f9ec06ccc7d9a5fb73e55e1ddd580d17c52369ab12a4688fdb1961
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffef3b2283afa05a6f5f6370d44f20f10535bd3da41245a94669aed13c81edc8
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 14.0,
5
- "global_step": 9380,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -244,11 +244,28 @@
244
  "eval_samples_per_second": 26.378,
245
  "eval_steps_per_second": 3.37,
246
  "step": 9380
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
247
  }
248
  ],
249
  "max_steps": 10050,
250
  "num_train_epochs": 15,
251
- "total_flos": 6.969087095470326e+18,
252
  "trial_name": null,
253
  "trial_params": null
254
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 15.0,
5
+ "global_step": 10050,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
244
  "eval_samples_per_second": 26.378,
245
  "eval_steps_per_second": 3.37,
246
  "step": 9380
247
+ },
248
+ {
249
+ "epoch": 15.0,
250
+ "learning_rate": 8.378718056137412e-08,
251
+ "loss": 0.054,
252
+ "step": 10050
253
+ },
254
+ {
255
+ "epoch": 15.0,
256
+ "eval_cer": 0.48787878787878786,
257
+ "eval_loss": 3.622342824935913,
258
+ "eval_new_wer": 0.19444444444444445,
259
+ "eval_old_wer": 0.8833333333333333,
260
+ "eval_runtime": 6.8734,
261
+ "eval_samples_per_second": 26.188,
262
+ "eval_steps_per_second": 3.346,
263
+ "step": 10050
264
  }
265
  ],
266
  "max_steps": 10050,
267
  "num_train_epochs": 15,
268
+ "total_flos": 7.467056434063227e+18,
269
  "trial_name": null,
270
  "trial_params": null
271
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe139ad8af6b60c1a91b2eaa1256fad6cc9d9968a1f8dc94872c4fb95570f04c
3
  size 377646433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2820bc90593d7e6a12e93895fccf5a57a04083cda0f9618714291c06c24172f6
3
  size 377646433