mprzibilla committed on
Commit
910915b
1 Parent(s): d641c34

Training in progress, step 25800

Browse files
config.json CHANGED
@@ -110,7 +110,7 @@
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
- "transformers_version": "4.18.0",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
 
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
+ "transformers_version": "4.23.1",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
last-checkpoint/config.json CHANGED
@@ -110,7 +110,7 @@
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
- "transformers_version": "4.18.0",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
 
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
+ "transformers_version": "4.23.1",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac937a33dea6ea7a219a5d92302391d3b62c72a19f9ff5c54c2bed1c61cdffac
3
- size 168159
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83701acb6b969bf186789b560373efc2306622973b3c28a8ae14621fa8ea2af9
3
+ size 168299
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:970781c36183b1552822b1fd90733e765d39fc56d7e083aa21858cc68f2befee
3
- size 377641431
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e53a60ab51721dbacf39cfe0fd8f5d7e000d712c291b9c6468f589550314653
3
+ size 377643361
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1bc4c868be43b8aee478444845fee509627b8673243a867ffa21afdae158b023
3
- size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bedc183fe4b3bee6a401ca9cd239cd2f5a261e21b1e0d0d190c9670c2192b2c
3
+ size 14639
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e7828115df4dda4d48eed4e47399971a9187269fd1c501ef2b68aaf29a23048
3
- size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fca9a24db2a129accee9ab827e1ed658add9ad4e2fd21ae130da0a36eb96656d
3
+ size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3fd97d7f7086d7e8d98ca6ed02a950b267fc075dbd24b6b2d7d971d9f49782e
3
- size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:384a9da4de591fb6eb7e3456e25f511cec76615b35d913dc0427c74b105c1704
3
+ size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,176 +1,32 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1000.0,
5
- "global_step": 258000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 100.0,
12
- "learning_rate": 9.47421460628315e-05,
13
- "loss": 13.3002,
14
  "step": 25800
15
  },
16
  {
17
  "epoch": 100.0,
18
- "eval_cer": 0.9238095238095239,
19
- "eval_loss": 2.9116570949554443,
20
- "eval_runtime": 1.0237,
21
- "eval_samples_per_second": 205.13,
22
- "eval_steps_per_second": 26.374,
23
  "eval_wer": 1.0,
24
  "step": 25800
25
- },
26
- {
27
- "epoch": 200.0,
28
- "learning_rate": 8.422072623419012e-05,
29
- "loss": 2.265,
30
- "step": 51600
31
- },
32
- {
33
- "epoch": 200.0,
34
- "eval_cer": 0.8943722943722944,
35
- "eval_loss": 2.9009172916412354,
36
- "eval_runtime": 1.0094,
37
- "eval_samples_per_second": 208.04,
38
- "eval_steps_per_second": 26.748,
39
- "eval_wer": 1.0,
40
- "step": 51600
41
- },
42
- {
43
- "epoch": 300.0,
44
- "learning_rate": 7.369889840881273e-05,
45
- "loss": 2.1533,
46
- "step": 77400
47
- },
48
- {
49
- "epoch": 300.0,
50
- "eval_cer": 0.8943722943722944,
51
- "eval_loss": 2.9222800731658936,
52
- "eval_runtime": 1.046,
53
- "eval_samples_per_second": 200.77,
54
- "eval_steps_per_second": 25.813,
55
- "eval_wer": 1.0,
56
- "step": 77400
57
- },
58
- {
59
- "epoch": 400.0,
60
- "learning_rate": 6.317747858017135e-05,
61
- "loss": 2.0998,
62
- "step": 103200
63
- },
64
- {
65
- "epoch": 400.0,
66
- "eval_cer": 0.8891774891774892,
67
- "eval_loss": 2.927011489868164,
68
- "eval_runtime": 1.0056,
69
- "eval_samples_per_second": 208.822,
70
- "eval_steps_per_second": 26.849,
71
- "eval_wer": 1.0,
72
- "step": 103200
73
- },
74
- {
75
- "epoch": 500.0,
76
- "learning_rate": 5.265565075479396e-05,
77
- "loss": 2.0687,
78
- "step": 129000
79
- },
80
- {
81
- "epoch": 500.0,
82
- "eval_cer": 0.8891774891774892,
83
- "eval_loss": 2.9528825283050537,
84
- "eval_runtime": 1.0218,
85
- "eval_samples_per_second": 205.522,
86
- "eval_steps_per_second": 26.424,
87
- "eval_wer": 1.0,
88
- "step": 129000
89
- },
90
- {
91
- "epoch": 600.0,
92
- "learning_rate": 4.2133822929416564e-05,
93
- "loss": 2.0491,
94
- "step": 154800
95
- },
96
- {
97
- "epoch": 600.0,
98
- "eval_cer": 0.8883116883116883,
99
- "eval_loss": 2.966721296310425,
100
- "eval_runtime": 1.0092,
101
- "eval_samples_per_second": 208.075,
102
- "eval_steps_per_second": 26.753,
103
- "eval_wer": 1.0,
104
- "step": 154800
105
- },
106
- {
107
- "epoch": 700.0,
108
- "learning_rate": 3.1611995104039174e-05,
109
- "loss": 2.0368,
110
- "step": 180600
111
- },
112
- {
113
- "epoch": 700.0,
114
- "eval_cer": 0.8874458874458875,
115
- "eval_loss": 2.9711692333221436,
116
- "eval_runtime": 1.0054,
117
- "eval_samples_per_second": 208.874,
118
- "eval_steps_per_second": 26.855,
119
- "eval_wer": 1.0,
120
- "step": 180600
121
- },
122
- {
123
- "epoch": 800.0,
124
- "learning_rate": 2.1089759281925745e-05,
125
- "loss": 2.0271,
126
- "step": 206400
127
- },
128
- {
129
- "epoch": 800.0,
130
- "eval_cer": 0.8874458874458875,
131
- "eval_loss": 2.976341724395752,
132
- "eval_runtime": 1.0209,
133
- "eval_samples_per_second": 205.708,
134
- "eval_steps_per_second": 26.448,
135
- "eval_wer": 1.0,
136
- "step": 206400
137
- },
138
- {
139
- "epoch": 900.0,
140
- "learning_rate": 1.0567523459812321e-05,
141
- "loss": 2.0223,
142
- "step": 232200
143
- },
144
- {
145
- "epoch": 900.0,
146
- "eval_cer": 0.8883116883116883,
147
- "eval_loss": 2.9786393642425537,
148
- "eval_runtime": 1.0096,
149
- "eval_samples_per_second": 207.998,
150
- "eval_steps_per_second": 26.743,
151
- "eval_wer": 1.0,
152
- "step": 232200
153
- },
154
- {
155
- "epoch": 1000.0,
156
- "learning_rate": 4.569563443492452e-08,
157
- "loss": 2.0195,
158
- "step": 258000
159
- },
160
- {
161
- "epoch": 1000.0,
162
- "eval_cer": 0.8883116883116883,
163
- "eval_loss": 2.979724645614624,
164
- "eval_runtime": 0.9979,
165
- "eval_samples_per_second": 210.433,
166
- "eval_steps_per_second": 27.056,
167
- "eval_wer": 1.0,
168
- "step": 258000
169
  }
170
  ],
171
  "max_steps": 258000,
172
  "num_train_epochs": 1000,
173
- "total_flos": 2.393792072555994e+20,
174
  "trial_name": null,
175
  "trial_params": null
176
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 100.0,
5
+ "global_step": 25800,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 100.0,
12
+ "learning_rate": 0.0004737107303141575,
13
+ "loss": 7.8597,
14
  "step": 25800
15
  },
16
  {
17
  "epoch": 100.0,
18
+ "eval_cer": 0.8900432900432901,
19
+ "eval_loss": 2.9528822898864746,
20
+ "eval_runtime": 7.7723,
21
+ "eval_samples_per_second": 27.019,
22
+ "eval_steps_per_second": 3.474,
23
  "eval_wer": 1.0,
24
  "step": 25800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  }
26
  ],
27
  "max_steps": 258000,
28
  "num_train_epochs": 1000,
29
+ "total_flos": 2.393393666838634e+19,
30
  "trial_name": null,
31
  "trial_params": null
32
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04ede9c1209942d838657385fae4d8de498ffc12e29e19e23dbbe5f1462ebc93
3
- size 3119
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cceccd22d2aabb29bc215bed86135bf7eb5b60193a7883cd6d1ae8c8d22b66a1
3
+ size 3387
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:970781c36183b1552822b1fd90733e765d39fc56d7e083aa21858cc68f2befee
3
- size 377641431
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e53a60ab51721dbacf39cfe0fd8f5d7e000d712c291b9c6468f589550314653
3
+ size 377643361
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04ede9c1209942d838657385fae4d8de498ffc12e29e19e23dbbe5f1462ebc93
3
- size 3119
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cceccd22d2aabb29bc215bed86135bf7eb5b60193a7883cd6d1ae8c8d22b66a1
3
+ size 3387