mprzibilla commited on
Commit
0072de9
1 Parent(s): af77d5d

Training in progress, epoch 15

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3708f0232add0b440707331fbfc234ae93e774e96ceb137682e09c3db9f76cc4
3
  size 721661957
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:286d22860ee8c90cae4c5ef4722e8fc173505dfd9ba17d2af095df690485fe2c
3
  size 721661957
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:143df86c3f9bb95948dbe505f344eafcf3df2e17b8ab7775170f907fe290411d
3
  size 377646433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cbd29fe88aee2ca43aa0b0cb29780a1b7300d7e76435cf1929e2d61d4cc58aa
3
  size 377646433
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37826454889cc005af1c4a5ffcdd7fcc45d5f29df3e5ea3ad78cccc90d3f06fb
3
  size 14639
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1069b7ffb3af89aa9f6f909347d8a8ba457c5127aa1618d6ba97e41c8338d5f
3
  size 14639
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0ff467205290e05f676b0bf254ddb940e84b6639dc95eeadff858daeeb3c5af
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b541a8e2a0672f656c80d20ec8a7263b01c69cbf1cc4017e763f43a73a46f5e3
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c0bc953e7af64bbf30cf0c251471e6877e9e05200f974ad209e3be5f909477b
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b29d56619f19dd624dc3d9ce779248fcca781dca28f83547cd64f3f5a24ff43b
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 14.0,
5
- "global_step": 59780,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -244,11 +244,28 @@
244
  "eval_samples_per_second": 23.774,
245
  "eval_steps_per_second": 3.057,
246
  "step": 59780
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
247
  }
248
  ],
249
  "max_steps": 64050,
250
  "num_train_epochs": 15,
251
- "total_flos": 4.7376645895196344e+19,
252
  "trial_name": null,
253
  "trial_params": null
254
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 15.0,
5
+ "global_step": 64050,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
244
  "eval_samples_per_second": 23.774,
245
  "eval_steps_per_second": 3.057,
246
  "step": 59780
247
+ },
248
+ {
249
+ "epoch": 15.0,
250
+ "learning_rate": 4.930318169865895e-08,
251
+ "loss": 0.0259,
252
+ "step": 64050
253
+ },
254
+ {
255
+ "epoch": 15.0,
256
+ "eval_cer": 0.6311688311688312,
257
+ "eval_loss": 4.495311260223389,
258
+ "eval_new_wer": 0.3047619047619048,
259
+ "eval_old_wer": 1.0,
260
+ "eval_runtime": 8.6991,
261
+ "eval_samples_per_second": 24.14,
262
+ "eval_steps_per_second": 3.104,
263
+ "step": 64050
264
  }
265
  ],
266
  "max_steps": 64050,
267
  "num_train_epochs": 15,
268
+ "total_flos": 5.076674134512955e+19,
269
  "trial_name": null,
270
  "trial_params": null
271
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:143df86c3f9bb95948dbe505f344eafcf3df2e17b8ab7775170f907fe290411d
3
  size 377646433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cbd29fe88aee2ca43aa0b0cb29780a1b7300d7e76435cf1929e2d61d4cc58aa
3
  size 377646433