mprzibilla committed on
Commit
774ab26
·
1 Parent(s): f69456c

Training in progress, step 6160

Browse files
config.json CHANGED
@@ -110,7 +110,7 @@
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
- "transformers_version": "4.18.0",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
 
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
+ "transformers_version": "4.23.1",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
last-checkpoint/config.json CHANGED
@@ -110,7 +110,7 @@
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
- "transformers_version": "4.18.0",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
 
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
+ "transformers_version": "4.23.1",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91b496b77db0775d4aafe63ebf99bb48b4cedc2b148375ade0078f50c49fcc12
3
- size 168159
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cec9875bd026091efa36e8010d350104fd0a4d2a4764c3c36ceadcb6052a0c39
3
+ size 721655813
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac76cdc6a11567deba22d2bf5690104a29bb9409be961b2f7cc85ec601ed2faf
3
- size 377641431
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a272e9147c0ac341d1a851b4f9beb9ad6e2a45b5ad4099cbb0bfb70cfe100965
3
+ size 377643361
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbf5cf665edebc10f59a508b1bdd4459e2986107eff89494df9748ccc5e92d22
3
- size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:617dd7671016dca2a947f53be356990669bafa6ea2f783a55f6f3a1236b37a0b
3
+ size 14575
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87eba8509565f31935d4802d6fd893f9a52221dec1363e87afb68f2247d77ad4
3
- size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b613b2755a27abb572474750570fb952279e467c6ae92352953cf4de82eeaee
3
+ size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0bf0b5bd1d17ed1b58127b096eff11d292865966f32e83e2cd2210f9b28d40c
3
- size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3970e66b4828758eb5d9ec8312235775ae992b288b8e94eeb891496be72cd0a5
3
+ size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,176 +1,32 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 250.0,
5
- "global_step": 123250,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 25.0,
12
- "learning_rate": 9.474412407761683e-05,
13
- "loss": 19.1039,
14
- "step": 12325
15
  },
16
  {
17
- "epoch": 25.0,
18
- "eval_cer": 0.9757575757575757,
19
- "eval_loss": 3.695141077041626,
20
- "eval_runtime": 1.0205,
21
- "eval_samples_per_second": 205.79,
22
- "eval_steps_per_second": 26.459,
23
- "eval_wer": 1.0,
24
- "step": 12325
25
- },
26
- {
27
- "epoch": 50.0,
28
- "learning_rate": 8.422041541404757e-05,
29
- "loss": 2.7071,
30
- "step": 24650
31
- },
32
- {
33
- "epoch": 50.0,
34
- "eval_cer": 0.9341991341991343,
35
- "eval_loss": 3.8789684772491455,
36
- "eval_runtime": 1.0032,
37
- "eval_samples_per_second": 209.335,
38
- "eval_steps_per_second": 26.914,
39
- "eval_wer": 1.0,
40
- "step": 24650
41
- },
42
- {
43
- "epoch": 75.0,
44
- "learning_rate": 7.369841486745012e-05,
45
- "loss": 2.5758,
46
- "step": 36975
47
- },
48
- {
49
- "epoch": 75.0,
50
- "eval_cer": 0.9125541125541126,
51
- "eval_loss": 3.856503963470459,
52
- "eval_runtime": 0.9967,
53
- "eval_samples_per_second": 210.695,
54
- "eval_steps_per_second": 27.089,
55
- "eval_wer": 1.0,
56
- "step": 36975
57
- },
58
- {
59
- "epoch": 100.0,
60
- "learning_rate": 6.317726837933862e-05,
61
- "loss": 2.5155,
62
- "step": 49300
63
- },
64
- {
65
- "epoch": 100.0,
66
- "eval_cer": 0.9168831168831169,
67
- "eval_loss": 3.8677046298980713,
68
- "eval_runtime": 1.0011,
69
- "eval_samples_per_second": 209.777,
70
- "eval_steps_per_second": 26.971,
71
- "eval_wer": 1.0,
72
- "step": 49300
73
- },
74
- {
75
- "epoch": 125.0,
76
- "learning_rate": 5.2655267832741184e-05,
77
- "loss": 2.4801,
78
- "step": 61625
79
- },
80
- {
81
- "epoch": 125.0,
82
- "eval_cer": 0.9168831168831169,
83
- "eval_loss": 3.8714091777801514,
84
- "eval_runtime": 1.0139,
85
- "eval_samples_per_second": 207.112,
86
- "eval_steps_per_second": 26.629,
87
- "eval_wer": 1.0,
88
- "step": 61625
89
- },
90
- {
91
- "epoch": 150.0,
92
- "learning_rate": 4.213241322765783e-05,
93
- "loss": 2.4591,
94
- "step": 73950
95
- },
96
- {
97
- "epoch": 150.0,
98
- "eval_cer": 0.922943722943723,
99
- "eval_loss": 3.857038736343384,
100
- "eval_runtime": 1.0003,
101
- "eval_samples_per_second": 209.939,
102
- "eval_steps_per_second": 26.992,
103
- "eval_wer": 1.0,
104
- "step": 73950
105
- },
106
- {
107
- "epoch": 175.0,
108
- "learning_rate": 3.16104126810604e-05,
109
- "loss": 2.4435,
110
- "step": 86275
111
- },
112
- {
113
- "epoch": 175.0,
114
- "eval_cer": 0.9125541125541126,
115
- "eval_loss": 3.8484246730804443,
116
- "eval_runtime": 0.9998,
117
- "eval_samples_per_second": 210.042,
118
- "eval_steps_per_second": 27.005,
119
- "eval_wer": 1.0,
120
- "step": 86275
121
- },
122
- {
123
- "epoch": 200.0,
124
- "learning_rate": 2.108841213446297e-05,
125
- "loss": 2.4329,
126
- "step": 98600
127
- },
128
- {
129
- "epoch": 200.0,
130
- "eval_cer": 0.9125541125541126,
131
- "eval_loss": 3.83984637260437,
132
- "eval_runtime": 1.0007,
133
- "eval_samples_per_second": 209.858,
134
- "eval_steps_per_second": 26.982,
135
- "eval_wer": 1.0,
136
- "step": 98600
137
- },
138
- {
139
- "epoch": 225.0,
140
- "learning_rate": 1.0565557529379612e-05,
141
- "loss": 2.4266,
142
- "step": 110925
143
- },
144
- {
145
- "epoch": 225.0,
146
- "eval_cer": 0.90995670995671,
147
- "eval_loss": 3.8467934131622314,
148
- "eval_runtime": 1.0035,
149
- "eval_samples_per_second": 209.258,
150
- "eval_steps_per_second": 26.905,
151
- "eval_wer": 1.0,
152
- "step": 110925
153
- },
154
- {
155
- "epoch": 250.0,
156
- "learning_rate": 4.355698278218093e-08,
157
- "loss": 2.4229,
158
- "step": 123250
159
- },
160
- {
161
- "epoch": 250.0,
162
- "eval_cer": 0.9116883116883117,
163
- "eval_loss": 3.849649667739868,
164
- "eval_runtime": 1.0002,
165
- "eval_samples_per_second": 209.958,
166
- "eval_steps_per_second": 26.995,
167
- "eval_wer": 1.0,
168
- "step": 123250
169
  }
170
  ],
171
- "max_steps": 123250,
172
- "num_train_epochs": 250,
173
- "total_flos": 1.1400455629774925e+20,
174
  "trial_name": null,
175
  "trial_params": null
176
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 10.0,
5
+ "global_step": 6160,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 10.0,
12
+ "learning_rate": 9.475051264524949e-05,
13
+ "loss": 4.1068,
14
+ "step": 6160
15
  },
16
  {
17
+ "epoch": 10.0,
18
+ "eval_cer": 0.47359307359307357,
19
+ "eval_loss": 4.263599395751953,
20
+ "eval_runtime": 7.5888,
21
+ "eval_samples_per_second": 27.672,
22
+ "eval_steps_per_second": 3.558,
23
+ "eval_wer": 0.8904761904761904,
24
+ "step": 6160
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  }
26
  ],
27
+ "max_steps": 61600,
28
+ "num_train_epochs": 100,
29
+ "total_flos": 4.5525339060428145e+18,
30
  "trial_name": null,
31
  "trial_params": null
32
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1284c9db1fbd6ffd1a05741124b3d17a18ce5a697d22cde3b856c57d54e1290
3
- size 3119
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a93853e8d3350b9736431ab93f767de49f660529f7cab12962ec53dd998b74d7
3
+ size 3451
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac76cdc6a11567deba22d2bf5690104a29bb9409be961b2f7cc85ec601ed2faf
3
- size 377641431
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a272e9147c0ac341d1a851b4f9beb9ad6e2a45b5ad4099cbb0bfb70cfe100965
3
+ size 377643361
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1284c9db1fbd6ffd1a05741124b3d17a18ce5a697d22cde3b856c57d54e1290
3
- size 3119
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a93853e8d3350b9736431ab93f767de49f660529f7cab12962ec53dd998b74d7
3
+ size 3451