mprzibilla committed on
Commit
f965a08
·
1 Parent(s): 6c69b84

Training in progress, step 42810

Browse files
config.json CHANGED
@@ -110,7 +110,7 @@
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
- "transformers_version": "4.18.0",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
 
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
+ "transformers_version": "4.23.1",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
last-checkpoint/config.json CHANGED
@@ -110,7 +110,7 @@
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
- "transformers_version": "4.18.0",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
 
110
  1
111
  ],
112
  "torch_dtype": "float32",
113
+ "transformers_version": "4.23.1",
114
  "use_weighted_layer_sum": false,
115
  "vocab_size": 27,
116
  "xvector_output_dim": 512
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6ac29af520d5b2c069e2f7210724ba20e90c5f6f39bc3151aa9d5293bef63a0
3
- size 168159
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abd1f7f1d403297755f3d5195182f64066b3cbb14ad9df999173a8b2f6e7e8ea
3
+ size 721655813
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2015c73f6c80fbd0a2ba632ff719eda3740f56cbcaf2a3e5487334058ef0a285
3
- size 377641431
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0181507564a84d0fc009847c4a6d46858cec8fce11b23062e1354e25fc731f5c
3
+ size 377643361
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9cb857b45444ea61e5d59104fd2a2497b5a0c76c5450fc0dec3c98b46cbf46b
3
- size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaff527cca738862a3889886f51982fcadd6245064e289441c0eaa95ec6106e0
3
+ size 14639
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53b4faa452efd0a4a469d55ad9c163be9464d5bc46c60bd640b8de4bf05f76ce
3
- size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97493d56a553721cad772ef2f326ac53e7a9868c5f23452c6a85ca3f0f2d22ee
3
+ size 557
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66dfc18c5043e3149c14c5c2e4388023eb1538d8f034288e82cfe5d1c38745f5
3
- size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f49cc27f208749ba85176e054a1f70b78d9840311ad2659b2725be6de92e8534
3
+ size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,176 +1,32 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 100.0,
5
- "global_step": 342500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 10.0,
12
- "learning_rate": 9.474237418363428e-05,
13
- "loss": 13.0104,
14
- "step": 34250
15
  },
16
  {
17
  "epoch": 10.0,
18
- "eval_cer": 0.9922077922077922,
19
- "eval_loss": 3.114701747894287,
20
- "eval_runtime": 0.6909,
21
- "eval_samples_per_second": 202.628,
22
- "eval_steps_per_second": 26.052,
23
- "eval_wer": 1.0,
24
- "step": 34250
25
- },
26
- {
27
- "epoch": 20.0,
28
- "learning_rate": 8.422005378409528e-05,
29
- "loss": 2.7462,
30
- "step": 68500
31
- },
32
- {
33
- "epoch": 20.0,
34
- "eval_cer": 0.9896103896103896,
35
- "eval_loss": 3.1291749477386475,
36
- "eval_runtime": 0.6768,
37
- "eval_samples_per_second": 206.855,
38
- "eval_steps_per_second": 26.596,
39
- "eval_wer": 1.0,
40
- "step": 68500
41
- },
42
- {
43
- "epoch": 30.0,
44
- "learning_rate": 7.369804072224357e-05,
45
- "loss": 2.676,
46
- "step": 102750
47
- },
48
- {
49
- "epoch": 30.0,
50
- "eval_cer": 0.987012987012987,
51
- "eval_loss": 3.133396863937378,
52
- "eval_runtime": 0.6746,
53
- "eval_samples_per_second": 207.544,
54
- "eval_steps_per_second": 26.684,
55
- "eval_wer": 1.0,
56
- "step": 102750
57
- },
58
- {
59
- "epoch": 40.0,
60
- "learning_rate": 6.317572032270458e-05,
61
- "loss": 2.649,
62
- "step": 137000
63
- },
64
- {
65
- "epoch": 40.0,
66
- "eval_cer": 0.9831168831168832,
67
- "eval_loss": 3.13140869140625,
68
- "eval_runtime": 0.6742,
69
- "eval_samples_per_second": 207.644,
70
- "eval_steps_per_second": 26.697,
71
- "eval_wer": 1.0,
72
- "step": 137000
73
- },
74
- {
75
- "epoch": 50.0,
76
- "learning_rate": 5.2652785247791016e-05,
77
- "loss": 2.6338,
78
- "step": 171250
79
- },
80
- {
81
- "epoch": 50.0,
82
- "eval_cer": 0.9844155844155844,
83
- "eval_loss": 3.1373016834259033,
84
- "eval_runtime": 0.6758,
85
- "eval_samples_per_second": 207.177,
86
- "eval_steps_per_second": 26.637,
87
- "eval_wer": 1.0,
88
- "step": 171250
89
- },
90
- {
91
- "epoch": 60.0,
92
- "learning_rate": 4.213107952362659e-05,
93
- "loss": 2.6245,
94
- "step": 205500
95
- },
96
- {
97
- "epoch": 60.0,
98
- "eval_cer": 0.9831168831168832,
99
- "eval_loss": 3.1429381370544434,
100
- "eval_runtime": 0.6795,
101
- "eval_samples_per_second": 206.043,
102
- "eval_steps_per_second": 26.491,
103
- "eval_wer": 1.0,
104
- "step": 205500
105
- },
106
- {
107
- "epoch": 70.0,
108
- "learning_rate": 3.160937379946216e-05,
109
- "loss": 2.619,
110
- "step": 239750
111
- },
112
- {
113
- "epoch": 70.0,
114
- "eval_cer": 0.9831168831168832,
115
- "eval_loss": 3.1534180641174316,
116
- "eval_runtime": 0.6752,
117
- "eval_samples_per_second": 207.339,
118
- "eval_steps_per_second": 26.658,
119
- "eval_wer": 1.0,
120
- "step": 239750
121
- },
122
- {
123
- "epoch": 80.0,
124
- "learning_rate": 2.108705339992317e-05,
125
- "loss": 2.6147,
126
- "step": 274000
127
- },
128
- {
129
- "epoch": 80.0,
130
- "eval_cer": 0.9844155844155844,
131
- "eval_loss": 3.146252155303955,
132
- "eval_runtime": 0.6763,
133
- "eval_samples_per_second": 207.007,
134
- "eval_steps_per_second": 26.615,
135
- "eval_wer": 1.0,
136
- "step": 274000
137
- },
138
- {
139
- "epoch": 90.0,
140
- "learning_rate": 1.056534767575874e-05,
141
- "loss": 2.6115,
142
- "step": 308250
143
- },
144
- {
145
- "epoch": 90.0,
146
- "eval_cer": 0.9831168831168832,
147
- "eval_loss": 3.1405744552612305,
148
- "eval_runtime": 0.6771,
149
- "eval_samples_per_second": 206.768,
150
- "eval_steps_per_second": 26.584,
151
- "eval_wer": 1.0,
152
- "step": 308250
153
- },
154
- {
155
- "epoch": 100.0,
156
- "learning_rate": 4.333461390703035e-08,
157
- "loss": 2.6102,
158
- "step": 342500
159
- },
160
- {
161
- "epoch": 100.0,
162
- "eval_cer": 0.9831168831168832,
163
- "eval_loss": 3.1426713466644287,
164
- "eval_runtime": 0.6615,
165
- "eval_samples_per_second": 211.646,
166
- "eval_steps_per_second": 27.212,
167
- "eval_wer": 1.0,
168
- "step": 342500
169
  }
170
  ],
171
- "max_steps": 342500,
172
  "num_train_epochs": 100,
173
- "total_flos": 3.2538079241368614e+20,
174
  "trial_name": null,
175
  "trial_params": null
176
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 10.0,
5
+ "global_step": 42810,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
  "epoch": 10.0,
12
+ "learning_rate": 9.474151391091605e-05,
13
+ "loss": 2.6003,
14
+ "step": 42810
15
  },
16
  {
17
  "epoch": 10.0,
18
+ "eval_cer": 0.8103896103896104,
19
+ "eval_loss": 4.999092102050781,
20
+ "eval_runtime": 5.1797,
21
+ "eval_samples_per_second": 27.029,
22
+ "eval_steps_per_second": 3.475,
23
+ "eval_wer": 0.9142857142857143,
24
+ "step": 42810
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  }
26
  ],
27
+ "max_steps": 428100,
28
  "num_train_epochs": 100,
29
+ "total_flos": 3.2399059329860952e+19,
30
  "trial_name": null,
31
  "trial_params": null
32
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bcd8c032f4a5e4bcadd8bc2ab6e77f3af4dc94f7fcec7d8f1bbc6210bc9d629
3
- size 3119
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9145f12772e3151c498dd0872c61d0f5e569349f097fa28226c40c4cf0a531a
3
+ size 3451
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2015c73f6c80fbd0a2ba632ff719eda3740f56cbcaf2a3e5487334058ef0a285
3
- size 377641431
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0181507564a84d0fc009847c4a6d46858cec8fce11b23062e1354e25fc731f5c
3
+ size 377643361
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bcd8c032f4a5e4bcadd8bc2ab6e77f3af4dc94f7fcec7d8f1bbc6210bc9d629
3
- size 3119
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9145f12772e3151c498dd0872c61d0f5e569349f097fa28226c40c4cf0a531a
3
+ size 3451