mprzibilla committed on
Commit
0c7ea71
1 Parent(s): c34d3e6

Training in progress, step 21350

Browse files
config.json CHANGED
@@ -110,7 +110,7 @@
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
- "transformers_version": "4.18.0",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 28,
116
  "xvector_output_dim": 512
 
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
+ "transformers_version": "4.23.1",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 28,
116
  "xvector_output_dim": 512
last-checkpoint/config.json CHANGED
@@ -110,7 +110,7 @@
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
- "transformers_version": "4.18.0",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 28,
116
  "xvector_output_dim": 512
 
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
+ "transformers_version": "4.23.1",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 28,
116
  "xvector_output_dim": 512
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fcc7857919e09b77e372558e040f9eb549afe29dd03060a5523a7eb842f9ddbf
3
- size 174303
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c7968b8efd13d5fc708b8d575bdfacce3f6faac04d2a82a6681be7767cb3a47
3
+ size 721661957
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b522e60d0d2a6ee27af3602669b1014da231da2f41574acaad118912eceeb40a
3
- size 377644503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23c29e7e62821dd9ebdecb0f80999e35b88a4c33b2f765c44a4a3067dd06ef8a
3
+ size 377646433
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b119c6ba94045170ce909d97437f8a62214d60f57d9820329c8e249ad1d0f477
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a815883a2570166bd8681954c208cd0afd701a2550fb682192af67da1655896c
3
+ size 14639
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a5beb41d03d0282f86de0df3b3801db507a048b5eb0500763cfc03e40601417
3
- size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:431969896cbea52c0fd9fb08d326480e121ae77403d61e7102d4920fa4fa6518
3
+ size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27135a9065f7161bbce1a83a7e57aa28ecc4c06a7e536eb74226e435b074bac0
3
- size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0af760cdb84b96d47402463fdc44064dac492fd9b85975a42428ed9c5f980ff1
3
+ size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,176 +1,32 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 100.0,
5
- "global_step": 341600,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 10.0,
12
- "learning_rate": 9.474208061136448e-05,
13
- "loss": 13.2913,
14
- "step": 34160
15
  },
16
  {
17
  "epoch": 10.0,
18
- "eval_cer": 0.9688311688311688,
19
- "eval_loss": 3.2334227561950684,
20
- "eval_runtime": 1.6446,
21
- "eval_samples_per_second": 127.692,
22
- "eval_steps_per_second": 16.418,
23
- "eval_wer": 1.0,
24
- "step": 34160
25
- },
26
- {
27
- "epoch": 20.0,
28
- "learning_rate": 8.421977073832122e-05,
29
- "loss": 2.7732,
30
- "step": 68320
31
- },
32
- {
33
- "epoch": 20.0,
34
- "eval_cer": 0.9541125541125541,
35
- "eval_loss": 3.2456371784210205,
36
- "eval_runtime": 1.138,
37
- "eval_samples_per_second": 184.54,
38
- "eval_steps_per_second": 23.727,
39
- "eval_wer": 1.0,
40
- "step": 68320
41
- },
42
- {
43
- "epoch": 30.0,
44
- "learning_rate": 7.369746086527796e-05,
45
- "loss": 2.6976,
46
- "step": 102480
47
- },
48
- {
49
- "epoch": 30.0,
50
- "eval_cer": 0.9558441558441558,
51
- "eval_loss": 3.2558517456054688,
52
- "eval_runtime": 1.1494,
53
- "eval_samples_per_second": 182.707,
54
- "eval_steps_per_second": 23.491,
55
- "eval_wer": 1.0,
56
- "step": 102480
57
- },
58
- {
59
- "epoch": 40.0,
60
- "learning_rate": 6.317545913965241e-05,
61
- "loss": 2.6683,
62
- "step": 136640
63
- },
64
- {
65
- "epoch": 40.0,
66
- "eval_cer": 0.9532467532467532,
67
- "eval_loss": 3.264427661895752,
68
- "eval_runtime": 1.1405,
69
- "eval_samples_per_second": 184.136,
70
- "eval_steps_per_second": 23.675,
71
- "eval_wer": 1.0,
72
- "step": 136640
73
- },
74
- {
75
- "epoch": 50.0,
76
- "learning_rate": 5.2653457414026874e-05,
77
- "loss": 2.6525,
78
- "step": 170800
79
- },
80
- {
81
- "epoch": 50.0,
82
- "eval_cer": 0.9549783549783549,
83
- "eval_loss": 3.274503469467163,
84
- "eval_runtime": 1.1464,
85
- "eval_samples_per_second": 183.187,
86
- "eval_steps_per_second": 23.553,
87
- "eval_wer": 1.0,
88
- "step": 170800
89
- },
90
- {
91
- "epoch": 60.0,
92
- "learning_rate": 4.213176383581906e-05,
93
- "loss": 2.6429,
94
- "step": 204960
95
- },
96
- {
97
- "epoch": 60.0,
98
- "eval_cer": 0.9532467532467532,
99
- "eval_loss": 3.263571262359619,
100
- "eval_runtime": 1.1355,
101
- "eval_samples_per_second": 184.948,
102
- "eval_steps_per_second": 23.779,
103
- "eval_wer": 1.0,
104
- "step": 204960
105
- },
106
- {
107
- "epoch": 70.0,
108
- "learning_rate": 3.160976211019352e-05,
109
- "loss": 2.6365,
110
- "step": 239120
111
- },
112
- {
113
- "epoch": 70.0,
114
- "eval_cer": 0.9532467532467532,
115
- "eval_loss": 3.2685256004333496,
116
- "eval_runtime": 1.1494,
117
- "eval_samples_per_second": 182.699,
118
- "eval_steps_per_second": 23.49,
119
- "eval_wer": 1.0,
120
- "step": 239120
121
- },
122
- {
123
- "epoch": 80.0,
124
- "learning_rate": 2.108776038456798e-05,
125
- "loss": 2.6334,
126
- "step": 273280
127
- },
128
- {
129
- "epoch": 80.0,
130
- "eval_cer": 0.9601731601731601,
131
- "eval_loss": 3.2787115573883057,
132
- "eval_runtime": 1.1465,
133
- "eval_samples_per_second": 183.166,
134
- "eval_steps_per_second": 23.55,
135
- "eval_wer": 1.0,
136
- "step": 273280
137
- },
138
- {
139
- "epoch": 90.0,
140
- "learning_rate": 1.0565450511524715e-05,
141
- "loss": 2.6303,
142
- "step": 307440
143
- },
144
- {
145
- "epoch": 90.0,
146
- "eval_cer": 0.9601731601731601,
147
- "eval_loss": 3.2688238620758057,
148
- "eval_runtime": 1.148,
149
- "eval_samples_per_second": 182.93,
150
- "eval_steps_per_second": 23.52,
151
- "eval_wer": 1.0,
152
- "step": 307440
153
- },
154
- {
155
- "epoch": 100.0,
156
- "learning_rate": 4.3448785899174166e-08,
157
- "loss": 2.63,
158
- "step": 341600
159
- },
160
- {
161
- "epoch": 100.0,
162
- "eval_cer": 0.9619047619047619,
163
- "eval_loss": 3.274722099304199,
164
- "eval_runtime": 1.1513,
165
- "eval_samples_per_second": 182.407,
166
- "eval_steps_per_second": 23.452,
167
- "eval_wer": 1.0,
168
- "step": 341600
169
  }
170
  ],
171
- "max_steps": 341600,
172
  "num_train_epochs": 100,
173
- "total_flos": 3.2456870768043944e+20,
174
  "trial_name": null,
175
  "trial_params": null
176
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 10.0,
5
+ "global_step": 21350,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 10.0,
12
+ "learning_rate": 9.474226549981512e-05,
13
+ "loss": 2.5212,
14
+ "step": 21350
15
  },
16
  {
17
  "epoch": 10.0,
18
+ "eval_cer": 0.587012987012987,
19
+ "eval_loss": 2.120373010635376,
20
+ "eval_runtime": 8.074,
21
+ "eval_samples_per_second": 26.009,
22
+ "eval_steps_per_second": 3.344,
23
+ "eval_wer": 0.9952380952380953,
24
+ "step": 21350
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  }
26
  ],
27
+ "max_steps": 213500,
28
  "num_train_epochs": 100,
29
+ "total_flos": 3.2799001703543853e+19,
30
  "trial_name": null,
31
  "trial_params": null
32
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:594585b932be751fb4c7e99db27752222da7b2cc805eb1149ec1dc9adf89f864
3
- size 3119
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e48be025d9de6e427cd8dae3eec60c35384929891f8fc67a0b488ae5ade59c15
3
+ size 3451
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b522e60d0d2a6ee27af3602669b1014da231da2f41574acaad118912eceeb40a
3
- size 377644503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23c29e7e62821dd9ebdecb0f80999e35b88a4c33b2f765c44a4a3067dd06ef8a
3
+ size 377646433
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:594585b932be751fb4c7e99db27752222da7b2cc805eb1149ec1dc9adf89f864
3
- size 3119
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e48be025d9de6e427cd8dae3eec60c35384929891f8fc67a0b488ae5ade59c15
3
+ size 3451