mprzibilla committed on
Commit
995530e
1 Parent(s): 1428a81

Training in progress, epoch 15

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02c3032c97cfb406e3df1997fc82b235fdf4b343d9731893321aff309d3ec39b
3
  size 721661957
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62572fe8c3253ef89a5879075cee362f139dc359c9f4d288ef7ee5a44f04f2ca
3
  size 721661957
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e03198156019d4a4cc89c394475471f08334d5aa6d515bea3d95adfd769ee04d
3
  size 377646433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f5c24802d2ddf25034479a6f5d742fae095bdf7e4f8c9d98298c81c7ea86c28
3
  size 377646433
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b582a61fc9db0b4c3ab7f9c6bcc7ec92bd6b554c9167e6aaf8ccf981d726604
3
- size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:878bc5201ec12a3758f64aeeda9034b9a01212beb81745ad60e9908a6606fc4f
3
+ size 14639
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:812ba51647b28422373531c50c6c75a733798cf99f711de0c49157a2c51b5905
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3efb0dbe6e7100aa99d1d61d828b8dff6a4d645e343bc99b3a57b3415b8240db
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e23e7308fe04ea4571d59a06bafc7864cde86f32c2c2dfcbb4d0fa8be4a954b
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9378d54f67fa75f090c07a0b880b082c7ac2926177e9eb5704ca2e9e1108531b
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 14.0,
5
- "global_step": 59780,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -244,11 +244,28 @@
244
  "eval_samples_per_second": 24.418,
245
  "eval_steps_per_second": 3.139,
246
  "step": 59780
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
247
  }
248
  ],
249
  "max_steps": 64050,
250
  "num_train_epochs": 15,
251
- "total_flos": 4.529033204206461e+19,
252
  "trial_name": null,
253
  "trial_params": null
254
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 15.0,
5
+ "global_step": 64050,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
244
  "eval_samples_per_second": 24.418,
245
  "eval_steps_per_second": 3.139,
246
  "step": 59780
247
+ },
248
+ {
249
+ "epoch": 15.0,
250
+ "learning_rate": 4.7659742308703654e-08,
251
+ "loss": 0.0469,
252
+ "step": 64050
253
+ },
254
+ {
255
+ "epoch": 15.0,
256
+ "eval_cer": 0.09004329004329005,
257
+ "eval_loss": 0.6429840922355652,
258
+ "eval_new_wer": 0.09523809523809523,
259
+ "eval_old_wer": 0.14285714285714285,
260
+ "eval_runtime": 8.622,
261
+ "eval_samples_per_second": 24.356,
262
+ "eval_steps_per_second": 3.132,
263
+ "step": 64050
264
  }
265
  ],
266
  "max_steps": 64050,
267
  "num_train_epochs": 15,
268
+ "total_flos": 4.852750717448731e+19,
269
  "trial_name": null,
270
  "trial_params": null
271
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e03198156019d4a4cc89c394475471f08334d5aa6d515bea3d95adfd769ee04d
3
  size 377646433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f5c24802d2ddf25034479a6f5d742fae095bdf7e4f8c9d98298c81c7ea86c28
3
  size 377646433