marcel committed on
Commit
c00c85b
1 Parent(s): 32419ff
Files changed (4) hide show
  1. optimizer.pt +1 -1
  2. pytorch_model.bin +1 -1
  3. scheduler.pt +1 -1
  4. trainer_state.json +31 -3
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06ec0667d993c3f120c1d8a82b4485dc0f1e1f05f231fae102da6dcf82e9d1f4
3
  size 2490339591
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:415f789cebf94dc975e2af37856a750f6a78c4e12af0b81cbeef753992d90419
3
  size 2490339591
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4fcc26137a3ca289aeb72befc5b018e20b28e0e43aa434fa2a2467b52372e02
3
  size 1262065048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dc27a79ad93085f47b570fdaf3825b555caa80cf07cabe1ba820b1fd6247b8a
3
  size 1262065048
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bea1393d7c8716a158a855861ef15a9d29632d763274abd05c73238c435e73b6
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69fca0da0f8fa986f151fcf8b07e0888193c079c13d2d8004abe9580c45c5584
3
  size 623
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.034587995930824,
5
- "global_step": 2000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -76,11 +76,39 @@
76
  "eval_samples_per_second": 7.991,
77
  "eval_wer": 0.42106879606879605,
78
  "step": 2000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
79
  }
80
  ],
81
  "max_steps": 29490,
82
  "num_train_epochs": 30,
83
- "total_flos": 1.1113863503200174e+19,
84
  "trial_name": null,
85
  "trial_params": null
86
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.8484231943031535,
5
+ "global_step": 2800,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
76
  "eval_samples_per_second": 7.991,
77
  "eval_wer": 0.42106879606879605,
78
  "step": 2000
79
+ },
80
+ {
81
+ "epoch": 2.44,
82
+ "learning_rate": 0.0002803380476026216,
83
+ "loss": 0.2606,
84
+ "step": 2400
85
+ },
86
+ {
87
+ "epoch": 2.44,
88
+ "eval_loss": 0.39613404870033264,
89
+ "eval_runtime": 233.8224,
90
+ "eval_samples_per_second": 8.002,
91
+ "eval_wer": 0.4057125307125307,
92
+ "step": 2400
93
+ },
94
+ {
95
+ "epoch": 2.85,
96
+ "learning_rate": 0.0002761986892031735,
97
+ "loss": 0.2475,
98
+ "step": 2800
99
+ },
100
+ {
101
+ "epoch": 2.85,
102
+ "eval_loss": 0.3680589497089386,
103
+ "eval_runtime": 235.255,
104
+ "eval_samples_per_second": 7.953,
105
+ "eval_wer": 0.39256756756756755,
106
+ "step": 2800
107
  }
108
  ],
109
  "max_steps": 29490,
110
  "num_train_epochs": 30,
111
+ "total_flos": 1.5548475390462444e+19,
112
  "trial_name": null,
113
  "trial_params": null
114
  }