mprzibilla commited on
Commit
652bfe7
1 Parent(s): 1cd0b48

Training in progress, epoch 15

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:300ea7a2c3812353c9e5340601b0f6d1afe800849d12ee4268749e5c8e3e18fa
3
  size 174443
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b2e35834074f19bc5222d3c8af123732ecaf310f7c9f23dccd514a0fefc4c57
3
  size 174443
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3dfaf09fe4afaa24abb2476b663651a08931ea7492098946dd00b2881087460a
3
  size 377646433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fdd83bce0be94c1d45bb977937e9084dac2cb76e797eac4044daa3dc8639b22
3
  size 377646433
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ed915321fff0d4cda44d8fdad5f1f38cdcf6d76811c32f0a5ce0b9751767779
3
  size 14639
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63d5ccf1b0ffdd4638e6e2647e36a4f32f89f322ea80cdd67e65f7a7c51f6a0c
3
  size 14639
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70bf93fdfba664304e5d33e228d504d5cad19a40c638afc0ec24a21d28f9ae8c
3
  size 557
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:614dcd144644e40eeba8333744c7822a05c774de62a1e066c6cfdf0f6212d9b6
3
  size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c0bc953e7af64bbf30cf0c251471e6877e9e05200f974ad209e3be5f909477b
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b29d56619f19dd624dc3d9ce779248fcca781dca28f83547cd64f3f5a24ff43b
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 14.0,
5
- "global_step": 59780,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -244,11 +244,28 @@
244
  "eval_samples_per_second": 24.363,
245
  "eval_steps_per_second": 3.132,
246
  "step": 59780
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
247
  }
248
  ],
249
  "max_steps": 64050,
250
  "num_train_epochs": 15,
251
- "total_flos": 4.740687154830613e+19,
252
  "trial_name": null,
253
  "trial_params": null
254
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 15.0,
5
+ "global_step": 64050,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
244
  "eval_samples_per_second": 24.363,
245
  "eval_steps_per_second": 3.132,
246
  "step": 59780
247
+ },
248
+ {
249
+ "epoch": 15.0,
250
+ "learning_rate": 4.930318169865895e-08,
251
+ "loss": 2.8106,
252
+ "step": 64050
253
+ },
254
+ {
255
+ "epoch": 15.0,
256
+ "eval_cer": 0.9593073593073593,
257
+ "eval_loss": 3.131213426589966,
258
+ "eval_new_wer": 0.9333333333333333,
259
+ "eval_old_wer": 1.0,
260
+ "eval_runtime": 8.5832,
261
+ "eval_samples_per_second": 24.466,
262
+ "eval_steps_per_second": 3.146,
263
+ "step": 64050
264
  }
265
  ],
266
  "max_steps": 64050,
267
  "num_train_epochs": 15,
268
+ "total_flos": 5.079400634281409e+19,
269
  "trial_name": null,
270
  "trial_params": null
271
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3dfaf09fe4afaa24abb2476b663651a08931ea7492098946dd00b2881087460a
3
  size 377646433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fdd83bce0be94c1d45bb977937e9084dac2cb76e797eac4044daa3dc8639b22
3
  size 377646433