Rakib committed on
Commit
ccd97db
1 Parent(s): 5c20d4e

Training in progress, step 1000

Browse files
Files changed (41) hide show
  1. README.md +0 -60
  2. added_tokens.json +0 -108
  3. all_results.json +0 -13
  4. best_model/tokenizer_config.json +1 -1
  5. config.json +1 -1
  6. eval_results.json +0 -9
  7. generation_config.json +0 -222
  8. merges.txt +0 -0
  9. my-training.py +13 -13
  10. normalizer.json +0 -1742
  11. pytorch_model.bin +1 -1
  12. runs/May15_12-08-38_DESKTOP-OD7C1Q6/1684130924.7925029/events.out.tfevents.1684130924.DESKTOP-OD7C1Q6 +0 -3
  13. runs/May15_12-08-38_DESKTOP-OD7C1Q6/events.out.tfevents.1684130924.DESKTOP-OD7C1Q6 +0 -3
  14. runs/May15_12-15-25_DESKTOP-OD7C1Q6/1684131331.9202273/events.out.tfevents.1684131331.DESKTOP-OD7C1Q6 +0 -3
  15. runs/May15_12-15-25_DESKTOP-OD7C1Q6/events.out.tfevents.1684131331.DESKTOP-OD7C1Q6 +0 -3
  16. runs/May15_13-19-50_DESKTOP-OD7C1Q6/1684135196.836124/events.out.tfevents.1684135196.DESKTOP-OD7C1Q6 +0 -3
  17. runs/May15_13-19-50_DESKTOP-OD7C1Q6/events.out.tfevents.1684135196.DESKTOP-OD7C1Q6 +0 -3
  18. runs/May15_13-32-25_DESKTOP-OD7C1Q6/1684135953.274833/events.out.tfevents.1684135953.DESKTOP-OD7C1Q6 +0 -3
  19. runs/May15_13-32-25_DESKTOP-OD7C1Q6/events.out.tfevents.1684135953.DESKTOP-OD7C1Q6 +0 -3
  20. runs/May15_14-04-02_DESKTOP-OD7C1Q6/1684137848.1832855/events.out.tfevents.1684137848.DESKTOP-OD7C1Q6 +0 -3
  21. runs/May15_14-04-02_DESKTOP-OD7C1Q6/events.out.tfevents.1684137848.DESKTOP-OD7C1Q6 +0 -3
  22. runs/May15_14-48-43_DESKTOP-OD7C1Q6/1684140528.8114798/events.out.tfevents.1684140528.DESKTOP-OD7C1Q6 +0 -3
  23. runs/May15_14-48-43_DESKTOP-OD7C1Q6/events.out.tfevents.1684140528.DESKTOP-OD7C1Q6 +0 -3
  24. runs/May15_14-59-56_DESKTOP-OD7C1Q6/1684141202.0174327/events.out.tfevents.1684141202.DESKTOP-OD7C1Q6 +0 -3
  25. runs/May15_14-59-56_DESKTOP-OD7C1Q6/events.out.tfevents.1684141202.DESKTOP-OD7C1Q6 +0 -3
  26. runs/May15_15-12-20_DESKTOP-OD7C1Q6/1684141947.2878134/events.out.tfevents.1684141947.DESKTOP-OD7C1Q6 +0 -3
  27. runs/May15_15-12-20_DESKTOP-OD7C1Q6/events.out.tfevents.1684141947.DESKTOP-OD7C1Q6 +0 -3
  28. runs/May15_15-29-19_DESKTOP-OD7C1Q6/1684142964.8228638/events.out.tfevents.1684142964.DESKTOP-OD7C1Q6 +0 -3
  29. runs/May15_15-29-19_DESKTOP-OD7C1Q6/events.out.tfevents.1684142964.DESKTOP-OD7C1Q6 +0 -3
  30. runs/May15_15-47-11_DESKTOP-OD7C1Q6/1684144037.0687504/events.out.tfevents.1684144037.DESKTOP-OD7C1Q6 +0 -3
  31. runs/May15_15-47-11_DESKTOP-OD7C1Q6/events.out.tfevents.1684144037.DESKTOP-OD7C1Q6 +0 -3
  32. runs/May15_15-47-11_DESKTOP-OD7C1Q6/events.out.tfevents.1684144731.DESKTOP-OD7C1Q6 +0 -3
  33. runs/{May13_23-09-22_DESKTOP-OD7C1Q6/1683997770.2403045/events.out.tfevents.1683997770.DESKTOP-OD7C1Q6 → May15_16-55-04_DESKTOP-OD7C1Q6/1684148109.9478214/events.out.tfevents.1684148109.DESKTOP-OD7C1Q6} +2 -2
  34. runs/{May13_23-09-22_DESKTOP-OD7C1Q6/events.out.tfevents.1683997770.DESKTOP-OD7C1Q6 → May15_16-55-04_DESKTOP-OD7C1Q6/events.out.tfevents.1684148109.DESKTOP-OD7C1Q6} +2 -2
  35. runs/{May15_11-17-07_DESKTOP-OD7C1Q6/1684127833.5408869/events.out.tfevents.1684127833.DESKTOP-OD7C1Q6 → May15_22-40-19_DESKTOP-OD7C1Q6/1684168824.9625106/events.out.tfevents.1684168824.DESKTOP-OD7C1Q6} +2 -2
  36. runs/{May15_11-17-07_DESKTOP-OD7C1Q6/events.out.tfevents.1684127833.DESKTOP-OD7C1Q6 → May15_22-40-19_DESKTOP-OD7C1Q6/events.out.tfevents.1684168824.DESKTOP-OD7C1Q6} +2 -2
  37. special_tokens_map.json +0 -133
  38. tokenizer_config.json +0 -35
  39. train_results.json +0 -7
  40. trainer_state.json +0 -37
  41. training_args.bin +2 -2
README.md DELETED
@@ -1,60 +0,0 @@
1
- ---
2
- license: apache-2.0
3
- tags:
4
- - generated_from_trainer
5
- metrics:
6
- - wer
7
- model-index:
8
- - name: openai/whisper-small
9
- results: []
10
- ---
11
-
12
- <!-- This model card has been generated automatically according to the information the Trainer had access to. You
13
- should probably proofread and complete it, then remove this comment. -->
14
-
15
- # openai/whisper-small
16
-
17
- This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the None dataset.
18
- It achieves the following results on the evaluation set:
19
- - Loss: 1.9569
20
- - Cer: 304.7818
21
- - Wer: 369.68
22
-
23
- ## Model description
24
-
25
- More information needed
26
-
27
- ## Intended uses & limitations
28
-
29
- More information needed
30
-
31
- ## Training and evaluation data
32
-
33
- More information needed
34
-
35
- ## Training procedure
36
-
37
- ### Training hyperparameters
38
-
39
- The following hyperparameters were used during training:
40
- - learning_rate: 1e-05
41
- - train_batch_size: 4
42
- - eval_batch_size: 32
43
- - seed: 42
44
- - gradient_accumulation_steps: 16
45
- - total_train_batch_size: 64
46
- - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
47
- - lr_scheduler_type: cosine
48
- - lr_scheduler_warmup_steps: 1000
49
- - training_steps: 50
50
-
51
- ### Training results
52
-
53
-
54
-
55
- ### Framework versions
56
-
57
- - Transformers 4.28.0.dev0
58
- - Pytorch 2.0.0+cu117
59
- - Datasets 2.10.2.dev0
60
- - Tokenizers 0.13.2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
added_tokens.json DELETED
@@ -1,108 +0,0 @@
1
- {
2
- "<|af|>": 50327,
3
- "<|am|>": 50334,
4
- "<|ar|>": 50272,
5
- "<|as|>": 50350,
6
- "<|az|>": 50304,
7
- "<|ba|>": 50355,
8
- "<|be|>": 50330,
9
- "<|bg|>": 50292,
10
- "<|bn|>": 50302,
11
- "<|bo|>": 50347,
12
- "<|br|>": 50309,
13
- "<|bs|>": 50315,
14
- "<|ca|>": 50270,
15
- "<|cs|>": 50283,
16
- "<|cy|>": 50297,
17
- "<|da|>": 50285,
18
- "<|de|>": 50261,
19
- "<|el|>": 50281,
20
- "<|en|>": 50259,
21
- "<|es|>": 50262,
22
- "<|et|>": 50307,
23
- "<|eu|>": 50310,
24
- "<|fa|>": 50300,
25
- "<|fi|>": 50277,
26
- "<|fo|>": 50338,
27
- "<|fr|>": 50265,
28
- "<|gl|>": 50319,
29
- "<|gu|>": 50333,
30
- "<|haw|>": 50352,
31
- "<|ha|>": 50354,
32
- "<|he|>": 50279,
33
- "<|hi|>": 50276,
34
- "<|hr|>": 50291,
35
- "<|ht|>": 50339,
36
- "<|hu|>": 50286,
37
- "<|hy|>": 50312,
38
- "<|id|>": 50275,
39
- "<|is|>": 50311,
40
- "<|it|>": 50274,
41
- "<|ja|>": 50266,
42
- "<|jw|>": 50356,
43
- "<|ka|>": 50329,
44
- "<|kk|>": 50316,
45
- "<|km|>": 50323,
46
- "<|kn|>": 50306,
47
- "<|ko|>": 50264,
48
- "<|la|>": 50294,
49
- "<|lb|>": 50345,
50
- "<|ln|>": 50353,
51
- "<|lo|>": 50336,
52
- "<|lt|>": 50293,
53
- "<|lv|>": 50301,
54
- "<|mg|>": 50349,
55
- "<|mi|>": 50295,
56
- "<|mk|>": 50308,
57
- "<|ml|>": 50296,
58
- "<|mn|>": 50314,
59
- "<|mr|>": 50320,
60
- "<|ms|>": 50282,
61
- "<|mt|>": 50343,
62
- "<|my|>": 50346,
63
- "<|ne|>": 50313,
64
- "<|nl|>": 50271,
65
- "<|nn|>": 50342,
66
- "<|nocaptions|>": 50362,
67
- "<|notimestamps|>": 50363,
68
- "<|no|>": 50288,
69
- "<|oc|>": 50328,
70
- "<|pa|>": 50321,
71
- "<|pl|>": 50269,
72
- "<|ps|>": 50340,
73
- "<|pt|>": 50267,
74
- "<|ro|>": 50284,
75
- "<|ru|>": 50263,
76
- "<|sa|>": 50344,
77
- "<|sd|>": 50332,
78
- "<|si|>": 50322,
79
- "<|sk|>": 50298,
80
- "<|sl|>": 50305,
81
- "<|sn|>": 50324,
82
- "<|so|>": 50326,
83
- "<|sq|>": 50317,
84
- "<|sr|>": 50303,
85
- "<|startoflm|>": 50360,
86
- "<|startofprev|>": 50361,
87
- "<|startoftranscript|>": 50258,
88
- "<|su|>": 50357,
89
- "<|sv|>": 50273,
90
- "<|sw|>": 50318,
91
- "<|ta|>": 50287,
92
- "<|te|>": 50299,
93
- "<|tg|>": 50331,
94
- "<|th|>": 50289,
95
- "<|tk|>": 50341,
96
- "<|tl|>": 50348,
97
- "<|transcribe|>": 50359,
98
- "<|translate|>": 50358,
99
- "<|tr|>": 50268,
100
- "<|tt|>": 50351,
101
- "<|uk|>": 50280,
102
- "<|ur|>": 50290,
103
- "<|uz|>": 50337,
104
- "<|vi|>": 50278,
105
- "<|yi|>": 50335,
106
- "<|yo|>": 50325,
107
- "<|zh|>": 50260
108
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
all_results.json DELETED
@@ -1,13 +0,0 @@
1
- {
2
- "epoch": 1.31,
3
- "eval_cer": 304.78184991274,
4
- "eval_loss": 1.9569354057312012,
5
- "eval_runtime": 28.0459,
6
- "eval_samples_per_second": 1.783,
7
- "eval_steps_per_second": 0.071,
8
- "eval_wer": 369.68,
9
- "train_loss": 2.721541290283203,
10
- "train_runtime": 665.7853,
11
- "train_samples_per_second": 4.806,
12
- "train_steps_per_second": 0.075
13
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
best_model/tokenizer_config.json CHANGED
@@ -9,6 +9,7 @@
9
  "rstrip": false,
10
  "single_word": false
11
  },
 
12
  "eos_token": {
13
  "__type": "AddedToken",
14
  "content": "<|endoftext|>",
@@ -22,7 +23,6 @@
22
  "pad_token": null,
23
  "processor_class": "WhisperProcessor",
24
  "return_attention_mask": false,
25
- "special_tokens_map_file": null,
26
  "tokenizer_class": "WhisperTokenizer",
27
  "unk_token": {
28
  "__type": "AddedToken",
 
9
  "rstrip": false,
10
  "single_word": false
11
  },
12
+ "clean_up_tokenization_spaces": true,
13
  "eos_token": {
14
  "__type": "AddedToken",
15
  "content": "<|endoftext|>",
 
23
  "pad_token": null,
24
  "processor_class": "WhisperProcessor",
25
  "return_attention_mask": false,
 
26
  "tokenizer_class": "WhisperTokenizer",
27
  "unk_token": {
28
  "__type": "AddedToken",
config.json CHANGED
@@ -44,7 +44,7 @@
44
  "scale_embedding": false,
45
  "suppress_tokens": [],
46
  "torch_dtype": "float32",
47
- "transformers_version": "4.28.0.dev0",
48
  "use_cache": true,
49
  "use_weighted_layer_sum": false,
50
  "vocab_size": 51865
 
44
  "scale_embedding": false,
45
  "suppress_tokens": [],
46
  "torch_dtype": "float32",
47
+ "transformers_version": "4.30.0.dev0",
48
  "use_cache": true,
49
  "use_weighted_layer_sum": false,
50
  "vocab_size": 51865
eval_results.json DELETED
@@ -1,9 +0,0 @@
1
- {
2
- "epoch": 1.31,
3
- "eval_cer": 304.78184991274,
4
- "eval_loss": 1.9569354057312012,
5
- "eval_runtime": 28.0459,
6
- "eval_samples_per_second": 1.783,
7
- "eval_steps_per_second": 0.071,
8
- "eval_wer": 369.68
9
- }
 
 
 
 
 
 
 
 
 
 
generation_config.json DELETED
@@ -1,222 +0,0 @@
1
- {
2
- "begin_suppress_tokens": [
3
- 220,
4
- 50257
5
- ],
6
- "bos_token_id": 50257,
7
- "decoder_start_token_id": 50258,
8
- "eos_token_id": 50257,
9
- "forced_decoder_ids": [
10
- [
11
- 1,
12
- null
13
- ],
14
- [
15
- 2,
16
- 50359
17
- ]
18
- ],
19
- "is_multilingual": true,
20
- "lang_to_id": {
21
- "<|af|>": 50327,
22
- "<|am|>": 50334,
23
- "<|ar|>": 50272,
24
- "<|as|>": 50350,
25
- "<|az|>": 50304,
26
- "<|ba|>": 50355,
27
- "<|be|>": 50330,
28
- "<|bg|>": 50292,
29
- "<|bn|>": 50302,
30
- "<|bo|>": 50347,
31
- "<|br|>": 50309,
32
- "<|bs|>": 50315,
33
- "<|ca|>": 50270,
34
- "<|cs|>": 50283,
35
- "<|cy|>": 50297,
36
- "<|da|>": 50285,
37
- "<|de|>": 50261,
38
- "<|el|>": 50281,
39
- "<|en|>": 50259,
40
- "<|es|>": 50262,
41
- "<|et|>": 50307,
42
- "<|eu|>": 50310,
43
- "<|fa|>": 50300,
44
- "<|fi|>": 50277,
45
- "<|fo|>": 50338,
46
- "<|fr|>": 50265,
47
- "<|gl|>": 50319,
48
- "<|gu|>": 50333,
49
- "<|haw|>": 50352,
50
- "<|ha|>": 50354,
51
- "<|he|>": 50279,
52
- "<|hi|>": 50276,
53
- "<|hr|>": 50291,
54
- "<|ht|>": 50339,
55
- "<|hu|>": 50286,
56
- "<|hy|>": 50312,
57
- "<|id|>": 50275,
58
- "<|is|>": 50311,
59
- "<|it|>": 50274,
60
- "<|ja|>": 50266,
61
- "<|jw|>": 50356,
62
- "<|ka|>": 50329,
63
- "<|kk|>": 50316,
64
- "<|km|>": 50323,
65
- "<|kn|>": 50306,
66
- "<|ko|>": 50264,
67
- "<|la|>": 50294,
68
- "<|lb|>": 50345,
69
- "<|ln|>": 50353,
70
- "<|lo|>": 50336,
71
- "<|lt|>": 50293,
72
- "<|lv|>": 50301,
73
- "<|mg|>": 50349,
74
- "<|mi|>": 50295,
75
- "<|mk|>": 50308,
76
- "<|ml|>": 50296,
77
- "<|mn|>": 50314,
78
- "<|mr|>": 50320,
79
- "<|ms|>": 50282,
80
- "<|mt|>": 50343,
81
- "<|my|>": 50346,
82
- "<|ne|>": 50313,
83
- "<|nl|>": 50271,
84
- "<|nn|>": 50342,
85
- "<|no|>": 50288,
86
- "<|oc|>": 50328,
87
- "<|pa|>": 50321,
88
- "<|pl|>": 50269,
89
- "<|ps|>": 50340,
90
- "<|pt|>": 50267,
91
- "<|ro|>": 50284,
92
- "<|ru|>": 50263,
93
- "<|sa|>": 50344,
94
- "<|sd|>": 50332,
95
- "<|si|>": 50322,
96
- "<|sk|>": 50298,
97
- "<|sl|>": 50305,
98
- "<|sn|>": 50324,
99
- "<|so|>": 50326,
100
- "<|sq|>": 50317,
101
- "<|sr|>": 50303,
102
- "<|su|>": 50357,
103
- "<|sv|>": 50273,
104
- "<|sw|>": 50318,
105
- "<|ta|>": 50287,
106
- "<|te|>": 50299,
107
- "<|tg|>": 50331,
108
- "<|th|>": 50289,
109
- "<|tk|>": 50341,
110
- "<|tl|>": 50348,
111
- "<|tr|>": 50268,
112
- "<|tt|>": 50351,
113
- "<|uk|>": 50280,
114
- "<|ur|>": 50290,
115
- "<|uz|>": 50337,
116
- "<|vi|>": 50278,
117
- "<|yi|>": 50335,
118
- "<|yo|>": 50325,
119
- "<|zh|>": 50260
120
- },
121
- "max_initial_timestamp_index": 1,
122
- "max_length": 448,
123
- "max_new_tokens": 448,
124
- "no_timestamps_token_id": 50363,
125
- "pad_token_id": 50257,
126
- "return_timestamps": false,
127
- "suppress_tokens": [
128
- 1,
129
- 2,
130
- 7,
131
- 8,
132
- 9,
133
- 10,
134
- 14,
135
- 25,
136
- 26,
137
- 27,
138
- 28,
139
- 29,
140
- 31,
141
- 58,
142
- 59,
143
- 60,
144
- 61,
145
- 62,
146
- 63,
147
- 90,
148
- 91,
149
- 92,
150
- 93,
151
- 359,
152
- 503,
153
- 522,
154
- 542,
155
- 873,
156
- 893,
157
- 902,
158
- 918,
159
- 922,
160
- 931,
161
- 1350,
162
- 1853,
163
- 1982,
164
- 2460,
165
- 2627,
166
- 3246,
167
- 3253,
168
- 3268,
169
- 3536,
170
- 3846,
171
- 3961,
172
- 4183,
173
- 4667,
174
- 6585,
175
- 6647,
176
- 7273,
177
- 9061,
178
- 9383,
179
- 10428,
180
- 10929,
181
- 11938,
182
- 12033,
183
- 12331,
184
- 12562,
185
- 13793,
186
- 14157,
187
- 14635,
188
- 15265,
189
- 15618,
190
- 16553,
191
- 16604,
192
- 18362,
193
- 18956,
194
- 20075,
195
- 21675,
196
- 22520,
197
- 26130,
198
- 26161,
199
- 26435,
200
- 28279,
201
- 29464,
202
- 31650,
203
- 32302,
204
- 32470,
205
- 36865,
206
- 42863,
207
- 47425,
208
- 49870,
209
- 50254,
210
- 50258,
211
- 50358,
212
- 50359,
213
- 50360,
214
- 50361,
215
- 50362
216
- ],
217
- "task_to_id": {
218
- "transcribe": 50359,
219
- "translate": 50358
220
- },
221
- "transformers_version": "4.28.0.dev0"
222
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
merges.txt DELETED
The diff for this file is too large to render. See raw diff
 
my-training.py CHANGED
@@ -57,9 +57,9 @@ print(f"\n\n Loading {model_name} for {language} to {task}...this might take a w
57
  ## 3. Setting Up Training Args
58
  output_dir = "./"
59
  overwrite_output_dir = True
60
- max_steps = 50
61
  # max_steps = 5
62
- per_device_train_batch_size = 4
63
  # per_device_train_batch_size = 1
64
  per_device_eval_batch_size = 32
65
  # per_device_eval_batch_size = 1
@@ -69,14 +69,14 @@ dataloader_num_workers = 0 #Default: 0 and 0 for Windows
69
  gradient_checkpointing = False
70
  evaluation_strategy ="steps"
71
  # eval_steps = 5
72
- eval_steps = 100
73
  save_strategy = "steps"
74
- save_steps = 100
75
  # save_steps = 5
76
  save_total_limit = 5
77
  learning_rate = 1e-5
78
  lr_scheduler_type = "cosine" # "constant", "constant_with_warmup", "cosine", "cosine_with_restarts", "linear"(default), "polynomial", "inverse_sqrt"
79
- warmup_steps = 1000 # (1 epoch)
80
  # warmup_steps = 1
81
  logging_steps = 25
82
  # logging_steps = 1
@@ -90,7 +90,7 @@ bf16 = True
90
  # bf16 = False
91
  tf32 = True
92
  # tf32 = False
93
- generation_max_length = 448 # ensure that the generation_max_length is equal to model_max_length. model_max_length = 1024 for whisper-small (see tokenizer config.json) also make model.config.max_length = 1024
94
  report_to = ["tensorboard"]
95
  predict_with_generate = True
96
  push_to_hub = True
@@ -320,8 +320,9 @@ my_dataset["train"] = concatenate_datasets([my_dataset["train"], augmented_raw_t
320
  my_dataset["train"] = my_dataset["train"].shuffle(seed=42)
321
 
322
 
323
- my_dataset["train"] = my_dataset["train"].select(range(2500))
324
- my_dataset["test"] = my_dataset["test"].select(range(50))
 
325
 
326
  print("\n\n AFTER AUGMENTATION, FINAL train and validation sets are: ")
327
  print("\n FINAL DATASET: \n")
@@ -337,6 +338,7 @@ from transformers import WhisperFeatureExtractor, WhisperTokenizer, WhisperToken
337
 
338
  feature_extractor = WhisperFeatureExtractor.from_pretrained(model_name)
339
 
 
340
  # tokenizer = WhisperTokenizer.from_pretrained(model_name, language=language, task=task)
341
  # tokenizer = WhisperTokenizerFast.from_pretrained(model_name, language=language, task=task)
342
 
@@ -388,7 +390,6 @@ def prepare_dataset(batch):
388
 
389
  # compute input length
390
  batch["input_length"] = len(batch["audio"])
391
- # batch["input_length"] = len(batch["input_features"])
392
 
393
  # if spec augmentation applied, get attention_mask to guide the mask along time axis
394
  if apply_spec_augment:
@@ -426,8 +427,8 @@ my_dataset = my_dataset.map(prepare_dataset,
426
  num_proc=1, # if num_proc>1, then mapping might get stuck. use num_proc=1 in that case.
427
  load_from_cache_file=True,
428
  cache_file_names={
429
- "train" : os.path.join(base_dir, 'datasets_cache', 'lol_preprocessed_train_cache.arrow'),
430
- "test" : os.path.join(base_dir, 'datasets_cache', 'lol_preprocessed_test_cache.arrow'),
431
  }
432
  )
433
  ## OR this,
@@ -473,7 +474,7 @@ print("\n\n AFTER FILTERING INPUTS, final train and validation sets are: ")
473
  print(my_dataset)
474
  print("\n")
475
 
476
- max_label_length = generation_max_length #(max_label_length should be equal to generation_max_length)
477
 
478
  def filter_labels(labels_length):
479
  """Filter label sequences longer than max length (448)"""
@@ -643,7 +644,6 @@ if freeze_feature_encoder:
643
  model.freeze_feature_encoder()
644
 
645
  model.generation_config.max_length = generation_max_length
646
- model.generation_config.max_new_tokens = generation_max_length
647
 
648
  ## 16. Define the Training Configuration
649
  from transformers import Seq2SeqTrainingArguments
 
57
  ## 3. Setting Up Training Args
58
  output_dir = "./"
59
  overwrite_output_dir = True
60
+ max_steps = 40000
61
  # max_steps = 5
62
+ per_device_train_batch_size = 4
63
  # per_device_train_batch_size = 1
64
  per_device_eval_batch_size = 32
65
  # per_device_eval_batch_size = 1
 
69
  gradient_checkpointing = False
70
  evaluation_strategy ="steps"
71
  # eval_steps = 5
72
+ eval_steps = 1000
73
  save_strategy = "steps"
74
+ save_steps = 1000
75
  # save_steps = 5
76
  save_total_limit = 5
77
  learning_rate = 1e-5
78
  lr_scheduler_type = "cosine" # "constant", "constant_with_warmup", "cosine", "cosine_with_restarts", "linear"(default), "polynomial", "inverse_sqrt"
79
+ warmup_steps = 8000 # (1 epoch)
80
  # warmup_steps = 1
81
  logging_steps = 25
82
  # logging_steps = 1
 
90
  # bf16 = False
91
  tf32 = True
92
  # tf32 = False
93
+ generation_max_length = 448 # ensure that the generation_max_length is equal to model max_length. model max_length = 448 for whisper-small (see config.json).
94
  report_to = ["tensorboard"]
95
  predict_with_generate = True
96
  push_to_hub = True
 
320
  my_dataset["train"] = my_dataset["train"].shuffle(seed=42)
321
 
322
 
323
+ # For debugging
324
+ # my_dataset["train"] = my_dataset["train"].select(range(2500, 5000))
325
+ # my_dataset["test"] = my_dataset["test"].select(range(50))
326
 
327
  print("\n\n AFTER AUGMENTATION, FINAL train and validation sets are: ")
328
  print("\n FINAL DATASET: \n")
 
338
 
339
  feature_extractor = WhisperFeatureExtractor.from_pretrained(model_name)
340
 
341
+ ## No need as tokenizer gets already loaded while loading the processor
342
  # tokenizer = WhisperTokenizer.from_pretrained(model_name, language=language, task=task)
343
  # tokenizer = WhisperTokenizerFast.from_pretrained(model_name, language=language, task=task)
344
 
 
390
 
391
  # compute input length
392
  batch["input_length"] = len(batch["audio"])
 
393
 
394
  # if spec augmentation applied, get attention_mask to guide the mask along time axis
395
  if apply_spec_augment:
 
427
  num_proc=1, # if num_proc>1, then mapping might get stuck. use num_proc=1 in that case.
428
  load_from_cache_file=True,
429
  cache_file_names={
430
+ "train" : os.path.join(base_dir, 'datasets_cache', 'preprocessed_train_cache.arrow'),
431
+ "test" : os.path.join(base_dir, 'datasets_cache', 'preprocessed_test_cache.arrow'),
432
  }
433
  )
434
  ## OR this,
 
474
  print(my_dataset)
475
  print("\n")
476
 
477
+ max_label_length = generation_max_length #(max_label_length should be equal to max_length of model which is equal to generation_max_length)
478
 
479
  def filter_labels(labels_length):
480
  """Filter label sequences longer than max length (448)"""
 
644
  model.freeze_feature_encoder()
645
 
646
  model.generation_config.max_length = generation_max_length
 
647
 
648
  ## 16. Define the Training Configuration
649
  from transformers import Seq2SeqTrainingArguments
normalizer.json DELETED
@@ -1,1742 +0,0 @@
1
- {
2
- "accessorise": "accessorize",
3
- "accessorised": "accessorized",
4
- "accessorises": "accessorizes",
5
- "accessorising": "accessorizing",
6
- "acclimatisation": "acclimatization",
7
- "acclimatise": "acclimatize",
8
- "acclimatised": "acclimatized",
9
- "acclimatises": "acclimatizes",
10
- "acclimatising": "acclimatizing",
11
- "accoutrements": "accouterments",
12
- "aeon": "eon",
13
- "aeons": "eons",
14
- "aerogramme": "aerogram",
15
- "aerogrammes": "aerograms",
16
- "aeroplane": "airplane",
17
- "aeroplanes": "airplanes",
18
- "aesthete": "esthete",
19
- "aesthetes": "esthetes",
20
- "aesthetic": "esthetic",
21
- "aesthetically": "esthetically",
22
- "aesthetics": "esthetics",
23
- "aetiology": "etiology",
24
- "ageing": "aging",
25
- "aggrandisement": "aggrandizement",
26
- "agonise": "agonize",
27
- "agonised": "agonized",
28
- "agonises": "agonizes",
29
- "agonising": "agonizing",
30
- "agonisingly": "agonizingly",
31
- "almanack": "almanac",
32
- "almanacks": "almanacs",
33
- "aluminium": "aluminum",
34
- "amortisable": "amortizable",
35
- "amortisation": "amortization",
36
- "amortisations": "amortizations",
37
- "amortise": "amortize",
38
- "amortised": "amortized",
39
- "amortises": "amortizes",
40
- "amortising": "amortizing",
41
- "amphitheatre": "amphitheater",
42
- "amphitheatres": "amphitheaters",
43
- "anaemia": "anemia",
44
- "anaemic": "anemic",
45
- "anaesthesia": "anesthesia",
46
- "anaesthetic": "anesthetic",
47
- "anaesthetics": "anesthetics",
48
- "anaesthetise": "anesthetize",
49
- "anaesthetised": "anesthetized",
50
- "anaesthetises": "anesthetizes",
51
- "anaesthetising": "anesthetizing",
52
- "anaesthetist": "anesthetist",
53
- "anaesthetists": "anesthetists",
54
- "anaesthetize": "anesthetize",
55
- "anaesthetized": "anesthetized",
56
- "anaesthetizes": "anesthetizes",
57
- "anaesthetizing": "anesthetizing",
58
- "analogue": "analog",
59
- "analogues": "analogs",
60
- "analyse": "analyze",
61
- "analysed": "analyzed",
62
- "analyses": "analyzes",
63
- "analysing": "analyzing",
64
- "anglicise": "anglicize",
65
- "anglicised": "anglicized",
66
- "anglicises": "anglicizes",
67
- "anglicising": "anglicizing",
68
- "annualised": "annualized",
69
- "antagonise": "antagonize",
70
- "antagonised": "antagonized",
71
- "antagonises": "antagonizes",
72
- "antagonising": "antagonizing",
73
- "apologise": "apologize",
74
- "apologised": "apologized",
75
- "apologises": "apologizes",
76
- "apologising": "apologizing",
77
- "appal": "appall",
78
- "appals": "appalls",
79
- "appetiser": "appetizer",
80
- "appetisers": "appetizers",
81
- "appetising": "appetizing",
82
- "appetisingly": "appetizingly",
83
- "arbour": "arbor",
84
- "arbours": "arbors",
85
- "archaeologically": "archeologically",
86
- "archaeologist": "archeologist",
87
- "archaeologists": "archeologists",
88
- "archaeology": "archeology",
89
- "archeological": "archaeological",
90
- "ardour": "ardor",
91
- "armour": "armor",
92
- "armoured": "armored",
93
- "armourer": "armorer",
94
- "armourers": "armorers",
95
- "armouries": "armories",
96
- "armoury": "armory",
97
- "artefact": "artifact",
98
- "artefacts": "artifacts",
99
- "authorise": "authorize",
100
- "authorised": "authorized",
101
- "authorises": "authorizes",
102
- "authorising": "authorizing",
103
- "axe": "ax",
104
- "backpedalled": "backpedaled",
105
- "backpedalling": "backpedaling",
106
- "bannister": "banister",
107
- "bannisters": "banisters",
108
- "baptise": "baptize",
109
- "baptised": "baptized",
110
- "baptises": "baptizes",
111
- "baptising": "baptizing",
112
- "bastardise": "bastardize",
113
- "bastardised": "bastardized",
114
- "bastardises": "bastardizes",
115
- "bastardising": "bastardizing",
116
- "battleax": "battleaxe",
117
- "baulk": "balk",
118
- "baulked": "balked",
119
- "baulking": "balking",
120
- "baulks": "balks",
121
- "bedevilled": "bedeviled",
122
- "bedevilling": "bedeviling",
123
- "behaviour": "behavior",
124
- "behavioural": "behavioral",
125
- "behaviourism": "behaviorism",
126
- "behaviourist": "behaviorist",
127
- "behaviourists": "behaviorists",
128
- "behaviours": "behaviors",
129
- "behove": "behoove",
130
- "behoved": "behooved",
131
- "behoves": "behooves",
132
- "bejewelled": "bejeweled",
133
- "belabour": "belabor",
134
- "belaboured": "belabored",
135
- "belabouring": "belaboring",
136
- "belabours": "belabors",
137
- "bevelled": "beveled",
138
- "bevvies": "bevies",
139
- "bevvy": "bevy",
140
- "biassed": "biased",
141
- "biassing": "biasing",
142
- "bingeing": "binging",
143
- "bougainvillaea": "bougainvillea",
144
- "bougainvillaeas": "bougainvilleas",
145
- "bowdlerise": "bowdlerize",
146
- "bowdlerised": "bowdlerized",
147
- "bowdlerises": "bowdlerizes",
148
- "bowdlerising": "bowdlerizing",
149
- "breathalyse": "breathalyze",
150
- "breathalysed": "breathalyzed",
151
- "breathalyser": "breathalyzer",
152
- "breathalysers": "breathalyzers",
153
- "breathalyses": "breathalyzes",
154
- "breathalysing": "breathalyzing",
155
- "brutalise": "brutalize",
156
- "brutalised": "brutalized",
157
- "brutalises": "brutalizes",
158
- "brutalising": "brutalizing",
159
- "busses": "buses",
160
- "bussing": "busing",
161
- "caesarean": "cesarean",
162
- "caesareans": "cesareans",
163
- "calibre": "caliber",
164
- "calibres": "calibers",
165
- "calliper": "caliper",
166
- "callipers": "calipers",
167
- "callisthenics": "calisthenics",
168
- "canalise": "canalize",
169
- "canalised": "canalized",
170
- "canalises": "canalizes",
171
- "canalising": "canalizing",
172
- "cancelation": "cancellation",
173
- "cancelations": "cancellations",
174
- "cancelled": "canceled",
175
- "cancelling": "canceling",
176
- "candour": "candor",
177
- "cannibalise": "cannibalize",
178
- "cannibalised": "cannibalized",
179
- "cannibalises": "cannibalizes",
180
- "cannibalising": "cannibalizing",
181
- "canonise": "canonize",
182
- "canonised": "canonized",
183
- "canonises": "canonizes",
184
- "canonising": "canonizing",
185
- "capitalise": "capitalize",
186
- "capitalised": "capitalized",
187
- "capitalises": "capitalizes",
188
- "capitalising": "capitalizing",
189
- "caramelise": "caramelize",
190
- "caramelised": "caramelized",
191
- "caramelises": "caramelizes",
192
- "caramelising": "caramelizing",
193
- "carbonise": "carbonize",
194
- "carbonised": "carbonized",
195
- "carbonises": "carbonizes",
196
- "carbonising": "carbonizing",
197
- "carolled": "caroled",
198
- "carolling": "caroling",
199
- "catalogue": "catalog",
200
- "catalogued": "cataloged",
201
- "catalogues": "catalogs",
202
- "cataloguing": "cataloging",
203
- "catalyse": "catalyze",
204
- "catalysed": "catalyzed",
205
- "catalyses": "catalyzes",
206
- "catalysing": "catalyzing",
207
- "categorise": "categorize",
208
- "categorised": "categorized",
209
- "categorises": "categorizes",
210
- "categorising": "categorizing",
211
- "cauterise": "cauterize",
212
- "cauterised": "cauterized",
213
- "cauterises": "cauterizes",
214
- "cauterising": "cauterizing",
215
- "cavilled": "caviled",
216
- "cavilling": "caviling",
217
- "centigramme": "centigram",
218
- "centigrammes": "centigrams",
219
- "centilitre": "centiliter",
220
- "centilitres": "centiliters",
221
- "centimetre": "centimeter",
222
- "centimetres": "centimeters",
223
- "centralise": "centralize",
224
- "centralised": "centralized",
225
- "centralises": "centralizes",
226
- "centralising": "centralizing",
227
- "centre": "center",
228
- "centred": "centered",
229
- "centrefold": "centerfold",
230
- "centrefolds": "centerfolds",
231
- "centrepiece": "centerpiece",
232
- "centrepieces": "centerpieces",
233
- "centres": "centers",
234
- "channelled": "channeled",
235
- "channelling": "channeling",
236
- "characterise": "characterize",
237
- "characterised": "characterized",
238
- "characterises": "characterizes",
239
- "characterising": "characterizing",
240
- "cheque": "check",
241
- "chequebook": "checkbook",
242
- "chequebooks": "checkbooks",
243
- "chequered": "checkered",
244
- "cheques": "checks",
245
- "chilli": "chili",
246
- "chimaera": "chimera",
247
- "chimaeras": "chimeras",
248
- "chiselled": "chiseled",
249
- "chiselling": "chiseling",
250
- "circularise": "circularize",
251
- "circularised": "circularized",
252
- "circularises": "circularizes",
253
- "circularising": "circularizing",
254
- "civilise": "civilize",
255
- "civilised": "civilized",
256
- "civilises": "civilizes",
257
- "civilising": "civilizing",
258
- "clamour": "clamor",
259
- "clamoured": "clamored",
260
- "clamouring": "clamoring",
261
- "clamours": "clamors",
262
- "clangour": "clangor",
263
- "clarinettist": "clarinetist",
264
- "clarinettists": "clarinetists",
265
- "collectivise": "collectivize",
266
- "collectivised": "collectivized",
267
- "collectivises": "collectivizes",
268
- "collectivising": "collectivizing",
269
- "colonisation": "colonization",
270
- "colonise": "colonize",
271
- "colonised": "colonized",
272
- "coloniser": "colonizer",
273
- "colonisers": "colonizers",
274
- "colonises": "colonizes",
275
- "colonising": "colonizing",
276
- "colour": "color",
277
- "colourant": "colorant",
278
- "colourants": "colorants",
279
- "coloured": "colored",
280
- "coloureds": "coloreds",
281
- "colourful": "colorful",
282
- "colourfully": "colorfully",
283
- "colouring": "coloring",
284
- "colourize": "colorize",
285
- "colourized": "colorized",
286
- "colourizes": "colorizes",
287
- "colourizing": "colorizing",
288
- "colourless": "colorless",
289
- "colours": "colors",
290
- "commercialise": "commercialize",
291
- "commercialised": "commercialized",
292
- "commercialises": "commercializes",
293
- "commercialising": "commercializing",
294
- "compartmentalise": "compartmentalize",
295
- "compartmentalised": "compartmentalized",
296
- "compartmentalises": "compartmentalizes",
297
- "compartmentalising": "compartmentalizing",
298
- "computerise": "computerize",
299
- "computerised": "computerized",
300
- "computerises": "computerizes",
301
- "computerising": "computerizing",
302
- "conceptualise": "conceptualize",
303
- "conceptualised": "conceptualized",
304
- "conceptualises": "conceptualizes",
305
- "conceptualising": "conceptualizing",
306
- "connexion": "connection",
307
- "connexions": "connections",
308
- "contextualise": "contextualize",
309
- "contextualised": "contextualized",
310
- "contextualises": "contextualizes",
311
- "contextualising": "contextualizing",
312
- "cosier": "cozier",
313
- "cosies": "cozies",
314
- "cosiest": "coziest",
315
- "cosily": "cozily",
316
- "cosiness": "coziness",
317
- "cosy": "cozy",
318
- "councillor": "councilor",
319
- "councillors": "councilors",
320
- "counselled": "counseled",
321
- "counselling": "counseling",
322
- "counsellor": "counselor",
323
- "counsellors": "counselors",
324
- "crenelated": "crenellated",
325
- "criminalise": "criminalize",
326
- "criminalised": "criminalized",
327
- "criminalises": "criminalizes",
328
- "criminalising": "criminalizing",
329
- "criticise": "criticize",
330
- "criticised": "criticized",
331
- "criticises": "criticizes",
332
- "criticising": "criticizing",
333
- "crueller": "crueler",
334
- "cruellest": "cruelest",
335
- "crystallisation": "crystallization",
336
- "crystallise": "crystallize",
337
- "crystallised": "crystallized",
338
- "crystallises": "crystallizes",
339
- "crystallising": "crystallizing",
340
- "cudgelled": "cudgeled",
341
- "cudgelling": "cudgeling",
342
- "customise": "customize",
343
- "customised": "customized",
344
- "customises": "customizes",
345
- "customising": "customizing",
346
- "cypher": "cipher",
347
- "cyphers": "ciphers",
348
- "decentralisation": "decentralization",
349
- "decentralise": "decentralize",
350
- "decentralised": "decentralized",
351
- "decentralises": "decentralizes",
352
- "decentralising": "decentralizing",
353
- "decriminalisation": "decriminalization",
354
- "decriminalise": "decriminalize",
355
- "decriminalised": "decriminalized",
356
- "decriminalises": "decriminalizes",
357
- "decriminalising": "decriminalizing",
358
- "defence": "defense",
359
- "defenceless": "defenseless",
360
- "defences": "defenses",
361
- "dehumanisation": "dehumanization",
362
- "dehumanise": "dehumanize",
363
- "dehumanised": "dehumanized",
364
- "dehumanises": "dehumanizes",
365
- "dehumanising": "dehumanizing",
366
- "demeanour": "demeanor",
367
- "demilitarisation": "demilitarization",
368
- "demilitarise": "demilitarize",
369
- "demilitarised": "demilitarized",
370
- "demilitarises": "demilitarizes",
371
- "demilitarising": "demilitarizing",
372
- "demobilisation": "demobilization",
373
- "demobilise": "demobilize",
374
- "demobilised": "demobilized",
375
- "demobilises": "demobilizes",
376
- "demobilising": "demobilizing",
377
- "democratisation": "democratization",
378
- "democratise": "democratize",
379
- "democratised": "democratized",
380
- "democratises": "democratizes",
381
- "democratising": "democratizing",
382
- "demonise": "demonize",
383
- "demonised": "demonized",
384
- "demonises": "demonizes",
385
- "demonising": "demonizing",
386
- "demoralisation": "demoralization",
387
- "demoralise": "demoralize",
388
- "demoralised": "demoralized",
389
- "demoralises": "demoralizes",
390
- "demoralising": "demoralizing",
391
- "denationalisation": "denationalization",
392
- "denationalise": "denationalize",
393
- "denationalised": "denationalized",
394
- "denationalises": "denationalizes",
395
- "denationalising": "denationalizing",
396
- "deodorise": "deodorize",
397
- "deodorised": "deodorized",
398
- "deodorises": "deodorizes",
399
- "deodorising": "deodorizing",
400
- "depersonalise": "depersonalize",
401
- "depersonalised": "depersonalized",
402
- "depersonalises": "depersonalizes",
403
- "depersonalising": "depersonalizing",
404
- "deputise": "deputize",
405
- "deputised": "deputized",
406
- "deputises": "deputizes",
407
- "deputising": "deputizing",
408
- "desensitisation": "desensitization",
409
- "desensitise": "desensitize",
410
- "desensitised": "desensitized",
411
- "desensitises": "desensitizes",
412
- "desensitising": "desensitizing",
413
- "destabilisation": "destabilization",
414
- "destabilise": "destabilize",
415
- "destabilised": "destabilized",
416
- "destabilises": "destabilizes",
417
- "destabilising": "destabilizing",
418
- "dialled": "dialed",
419
- "dialling": "dialing",
420
- "dialogue": "dialog",
421
- "dialogues": "dialogs",
422
- "diarrhoea": "diarrhea",
423
- "digitise": "digitize",
424
- "digitised": "digitized",
425
- "digitises": "digitizes",
426
- "digitising": "digitizing",
427
- "disc": "disk",
428
- "discolour": "discolor",
429
- "discoloured": "discolored",
430
- "discolouring": "discoloring",
431
- "discolours": "discolors",
432
- "discs": "disks",
433
- "disembowelled": "disemboweled",
434
- "disembowelling": "disemboweling",
435
- "disfavour": "disfavor",
436
- "dishevelled": "disheveled",
437
- "dishonour": "dishonor",
438
- "dishonourable": "dishonorable",
439
- "dishonourably": "dishonorably",
440
- "dishonoured": "dishonored",
441
- "dishonouring": "dishonoring",
442
- "dishonours": "dishonors",
443
- "disorganisation": "disorganization",
444
- "disorganised": "disorganized",
445
- "distil": "distill",
446
- "distils": "distills",
447
- "dramatisation": "dramatization",
448
- "dramatisations": "dramatizations",
449
- "dramatise": "dramatize",
450
- "dramatised": "dramatized",
451
- "dramatises": "dramatizes",
452
- "dramatising": "dramatizing",
453
- "draught": "draft",
454
- "draughtboard": "draftboard",
455
- "draughtboards": "draftboards",
456
- "draughtier": "draftier",
457
- "draughtiest": "draftiest",
458
- "draughts": "drafts",
459
- "draughtsman": "draftsman",
460
- "draughtsmanship": "draftsmanship",
461
- "draughtsmen": "draftsmen",
462
- "draughtswoman": "draftswoman",
463
- "draughtswomen": "draftswomen",
464
- "draughty": "drafty",
465
- "drivelled": "driveled",
466
- "drivelling": "driveling",
467
- "duelled": "dueled",
468
- "duelling": "dueling",
469
- "economise": "economize",
470
- "economised": "economized",
471
- "economises": "economizes",
472
- "economising": "economizing",
473
- "editorialise": "editorialize",
474
- "editorialised": "editorialized",
475
- "editorialises": "editorializes",
476
- "editorialising": "editorializing",
477
- "edoema": "edema",
478
- "empathise": "empathize",
479
- "empathised": "empathized",
480
- "empathises": "empathizes",
481
- "empathising": "empathizing",
482
- "emphasise": "emphasize",
483
- "emphasised": "emphasized",
484
- "emphasises": "emphasizes",
485
- "emphasising": "emphasizing",
486
- "enamelled": "enameled",
487
- "enamelling": "enameling",
488
- "enamoured": "enamored",
489
- "encyclopaedia": "encyclopedia",
490
- "encyclopaedias": "encyclopedias",
491
- "encyclopaedic": "encyclopedic",
492
- "endeavour": "endeavor",
493
- "endeavoured": "endeavored",
494
- "endeavouring": "endeavoring",
495
- "endeavours": "endeavors",
496
- "energise": "energize",
497
- "energised": "energized",
498
- "energises": "energizes",
499
- "energising": "energizing",
500
- "enrol": "enroll",
501
- "enrols": "enrolls",
502
- "enthral": "enthrall",
503
- "enthrals": "enthralls",
504
- "epaulette": "epaulet",
505
- "epaulettes": "epaulets",
506
- "epicentre": "epicenter",
507
- "epicentres": "epicenters",
508
- "epilogue": "epilog",
509
- "epilogues": "epilogs",
510
- "epitomise": "epitomize",
511
- "epitomised": "epitomized",
512
- "epitomises": "epitomizes",
513
- "epitomising": "epitomizing",
514
- "equalisation": "equalization",
515
- "equalise": "equalize",
516
- "equalised": "equalized",
517
- "equaliser": "equalizer",
518
- "equalisers": "equalizers",
519
- "equalises": "equalizes",
520
- "equalising": "equalizing",
521
- "eulogise": "eulogize",
522
- "eulogised": "eulogized",
523
- "eulogises": "eulogizes",
524
- "eulogising": "eulogizing",
525
- "evangelise": "evangelize",
526
- "evangelised": "evangelized",
527
- "evangelises": "evangelizes",
528
- "evangelising": "evangelizing",
529
- "exorcise": "exorcize",
530
- "exorcised": "exorcized",
531
- "exorcises": "exorcizes",
532
- "exorcising": "exorcizing",
533
- "extemporisation": "extemporization",
534
- "extemporise": "extemporize",
535
- "extemporised": "extemporized",
536
- "extemporises": "extemporizes",
537
- "extemporising": "extemporizing",
538
- "externalisation": "externalization",
539
- "externalisations": "externalizations",
540
- "externalise": "externalize",
541
- "externalised": "externalized",
542
- "externalises": "externalizes",
543
- "externalising": "externalizing",
544
- "factorise": "factorize",
545
- "factorised": "factorized",
546
- "factorises": "factorizes",
547
- "factorising": "factorizing",
548
- "faecal": "fecal",
549
- "faeces": "feces",
550
- "familiarisation": "familiarization",
551
- "familiarise": "familiarize",
552
- "familiarised": "familiarized",
553
- "familiarises": "familiarizes",
554
- "familiarising": "familiarizing",
555
- "fantasise": "fantasize",
556
- "fantasised": "fantasized",
557
- "fantasises": "fantasizes",
558
- "fantasising": "fantasizing",
559
- "favour": "favor",
560
- "favourable": "favorable",
561
- "favourably": "favorably",
562
- "favoured": "favored",
563
- "favouring": "favoring",
564
- "favourite": "favorite",
565
- "favourites": "favorites",
566
- "favouritism": "favoritism",
567
- "favours": "favors",
568
- "feminise": "feminize",
569
- "feminised": "feminized",
570
- "feminises": "feminizes",
571
- "feminising": "feminizing",
572
- "fertilisation": "fertilization",
573
- "fertilise": "fertilize",
574
- "fertilised": "fertilized",
575
- "fertiliser": "fertilizer",
576
- "fertilisers": "fertilizers",
577
- "fertilises": "fertilizes",
578
- "fertilising": "fertilizing",
579
- "fervour": "fervor",
580
- "fibre": "fiber",
581
- "fibreglass": "fiberglass",
582
- "fibres": "fibers",
583
- "fictionalisation": "fictionalization",
584
- "fictionalisations": "fictionalizations",
585
- "fictionalise": "fictionalize",
586
- "fictionalised": "fictionalized",
587
- "fictionalises": "fictionalizes",
588
- "fictionalising": "fictionalizing",
589
- "fillet": "filet",
590
- "filleted": "fileted",
591
- "filleting": "fileting",
592
- "fillets": "filets",
593
- "finalisation": "finalization",
594
- "finalise": "finalize",
595
- "finalised": "finalized",
596
- "finalises": "finalizes",
597
- "finalising": "finalizing",
598
- "flautist": "flutist",
599
- "flautists": "flutists",
600
- "flavour": "flavor",
601
- "flavoured": "flavored",
602
- "flavouring": "flavoring",
603
- "flavourings": "flavorings",
604
- "flavourless": "flavorless",
605
- "flavours": "flavors",
606
- "flavoursome": "flavorsome",
607
- "flyer / flier": "flier / flyer",
608
- "foetal": "fetal",
609
- "foetid": "fetid",
610
- "foetus": "fetus",
611
- "foetuses": "fetuses",
612
- "formalisation": "formalization",
613
- "formalise": "formalize",
614
- "formalised": "formalized",
615
- "formalises": "formalizes",
616
- "formalising": "formalizing",
617
- "fossilisation": "fossilization",
618
- "fossilise": "fossilize",
619
- "fossilised": "fossilized",
620
- "fossilises": "fossilizes",
621
- "fossilising": "fossilizing",
622
- "fraternisation": "fraternization",
623
- "fraternise": "fraternize",
624
- "fraternised": "fraternized",
625
- "fraternises": "fraternizes",
626
- "fraternising": "fraternizing",
627
- "fulfil": "fulfill",
628
- "fulfilment": "fulfillment",
629
- "fulfils": "fulfills",
630
- "funnelled": "funneled",
631
- "funnelling": "funneling",
632
- "gage": "gauge",
633
- "gaged": "gauged",
634
- "gages": "gauges",
635
- "gaging": "gauging",
636
- "galvanise": "galvanize",
637
- "galvanised": "galvanized",
638
- "galvanises": "galvanizes",
639
- "galvanising": "galvanizing",
640
- "gambolled": "gamboled",
641
- "gambolling": "gamboling",
642
- "gaol": "jail",
643
- "gaolbird": "jailbird",
644
- "gaolbirds": "jailbirds",
645
- "gaolbreak": "jailbreak",
646
- "gaolbreaks": "jailbreaks",
647
- "gaoled": "jailed",
648
- "gaoler": "jailer",
649
- "gaolers": "jailers",
650
- "gaoling": "jailing",
651
- "gaols": "jails",
652
- "gasses": "gases",
653
- "generalisation": "generalization",
654
- "generalisations": "generalizations",
655
- "generalise": "generalize",
656
- "generalised": "generalized",
657
- "generalises": "generalizes",
658
- "generalising": "generalizing",
659
- "ghettoise": "ghettoize",
660
- "ghettoised": "ghettoized",
661
- "ghettoises": "ghettoizes",
662
- "ghettoising": "ghettoizing",
663
- "gipsies": "gypsies",
664
- "glamor": "glamour",
665
- "glamorise": "glamorize",
666
- "glamorised": "glamorized",
667
- "glamorises": "glamorizes",
668
- "glamorising": "glamorizing",
669
- "globalisation": "globalization",
670
- "globalise": "globalize",
671
- "globalised": "globalized",
672
- "globalises": "globalizes",
673
- "globalising": "globalizing",
674
- "glueing": "gluing",
675
- "goitre": "goiter",
676
- "goitres": "goiters",
677
- "gonorrhoea": "gonorrhea",
678
- "gramme": "gram",
679
- "grammes": "grams",
680
- "gravelled": "graveled",
681
- "grey": "gray",
682
- "greyed": "grayed",
683
- "greying": "graying",
684
- "greyish": "grayish",
685
- "greyness": "grayness",
686
- "greys": "grays",
687
- "grovelled": "groveled",
688
- "grovelling": "groveling",
689
- "groyne": "groin",
690
- "groynes": "groins",
691
- "gruelling": "grueling",
692
- "gruellingly": "gruelingly",
693
- "gryphon": "griffin",
694
- "gryphons": "griffins",
695
- "gynaecological": "gynecological",
696
- "gynaecologist": "gynecologist",
697
- "gynaecologists": "gynecologists",
698
- "gynaecology": "gynecology",
699
- "haematological": "hematological",
700
- "haematologist": "hematologist",
701
- "haematologists": "hematologists",
702
- "haematology": "hematology",
703
- "haemoglobin": "hemoglobin",
704
- "haemophilia": "hemophilia",
705
- "haemophiliac": "hemophiliac",
706
- "haemophiliacs": "hemophiliacs",
707
- "haemorrhage": "hemorrhage",
708
- "haemorrhaged": "hemorrhaged",
709
- "haemorrhages": "hemorrhages",
710
- "haemorrhaging": "hemorrhaging",
711
- "haemorrhoids": "hemorrhoids",
712
- "harbour": "harbor",
713
- "harboured": "harbored",
714
- "harbouring": "harboring",
715
- "harbours": "harbors",
716
- "harmonisation": "harmonization",
717
- "harmonise": "harmonize",
718
- "harmonised": "harmonized",
719
- "harmonises": "harmonizes",
720
- "harmonising": "harmonizing",
721
- "homoeopath": "homeopath",
722
- "homoeopathic": "homeopathic",
723
- "homoeopaths": "homeopaths",
724
- "homoeopathy": "homeopathy",
725
- "homogenise": "homogenize",
726
- "homogenised": "homogenized",
727
- "homogenises": "homogenizes",
728
- "homogenising": "homogenizing",
729
- "honour": "honor",
730
- "honourable": "honorable",
731
- "honourably": "honorably",
732
- "honoured": "honored",
733
- "honouring": "honoring",
734
- "honours": "honors",
735
- "hospitalisation": "hospitalization",
736
- "hospitalise": "hospitalize",
737
- "hospitalised": "hospitalized",
738
- "hospitalises": "hospitalizes",
739
- "hospitalising": "hospitalizing",
740
- "humanise": "humanize",
741
- "humanised": "humanized",
742
- "humanises": "humanizes",
743
- "humanising": "humanizing",
744
- "humour": "humor",
745
- "humoured": "humored",
746
- "humouring": "humoring",
747
- "humourless": "humorless",
748
- "humours": "humors",
749
- "hybridise": "hybridize",
750
- "hybridised": "hybridized",
751
- "hybridises": "hybridizes",
752
- "hybridising": "hybridizing",
753
- "hypnotise": "hypnotize",
754
- "hypnotised": "hypnotized",
755
- "hypnotises": "hypnotizes",
756
- "hypnotising": "hypnotizing",
757
- "hypothesise": "hypothesize",
758
- "hypothesised": "hypothesized",
759
- "hypothesises": "hypothesizes",
760
- "hypothesising": "hypothesizing",
761
- "idealisation": "idealization",
762
- "idealise": "idealize",
763
- "idealised": "idealized",
764
- "idealises": "idealizes",
765
- "idealising": "idealizing",
766
- "idolise": "idolize",
767
- "idolised": "idolized",
768
- "idolises": "idolizes",
769
- "idolising": "idolizing",
770
- "immobilisation": "immobilization",
771
- "immobilise": "immobilize",
772
- "immobilised": "immobilized",
773
- "immobiliser": "immobilizer",
774
- "immobilisers": "immobilizers",
775
- "immobilises": "immobilizes",
776
- "immobilising": "immobilizing",
777
- "immortalise": "immortalize",
778
- "immortalised": "immortalized",
779
- "immortalises": "immortalizes",
780
- "immortalising": "immortalizing",
781
- "immunisation": "immunization",
782
- "immunise": "immunize",
783
- "immunised": "immunized",
784
- "immunises": "immunizes",
785
- "immunising": "immunizing",
786
- "impanelled": "impaneled",
787
- "impanelling": "impaneling",
788
- "imperilled": "imperiled",
789
- "imperilling": "imperiling",
790
- "individualise": "individualize",
791
- "individualised": "individualized",
792
- "individualises": "individualizes",
793
- "individualising": "individualizing",
794
- "industrialise": "industrialize",
795
- "industrialised": "industrialized",
796
- "industrialises": "industrializes",
797
- "industrialising": "industrializing",
798
- "inflexion": "inflection",
799
- "inflexions": "inflections",
800
- "initialise": "initialize",
801
- "initialised": "initialized",
802
- "initialises": "initializes",
803
- "initialising": "initializing",
804
- "initialled": "initialed",
805
- "initialling": "initialing",
806
- "instal": "install",
807
- "instalment": "installment",
808
- "instalments": "installments",
809
- "instals": "installs",
810
- "instil": "instill",
811
- "instils": "instills",
812
- "institutionalisation": "institutionalization",
813
- "institutionalise": "institutionalize",
814
- "institutionalised": "institutionalized",
815
- "institutionalises": "institutionalizes",
816
- "institutionalising": "institutionalizing",
817
- "intellectualise": "intellectualize",
818
- "intellectualised": "intellectualized",
819
- "intellectualises": "intellectualizes",
820
- "intellectualising": "intellectualizing",
821
- "internalisation": "internalization",
822
- "internalise": "internalize",
823
- "internalised": "internalized",
824
- "internalises": "internalizes",
825
- "internalising": "internalizing",
826
- "internationalisation": "internationalization",
827
- "internationalise": "internationalize",
828
- "internationalised": "internationalized",
829
- "internationalises": "internationalizes",
830
- "internationalising": "internationalizing",
831
- "ionisation": "ionization",
832
- "ionise": "ionize",
833
- "ionised": "ionized",
834
- "ioniser": "ionizer",
835
- "ionisers": "ionizers",
836
- "ionises": "ionizes",
837
- "ionising": "ionizing",
838
- "italicise": "italicize",
839
- "italicised": "italicized",
840
- "italicises": "italicizes",
841
- "italicising": "italicizing",
842
- "itemise": "itemize",
843
- "itemised": "itemized",
844
- "itemises": "itemizes",
845
- "itemising": "itemizing",
846
- "jeopardise": "jeopardize",
847
- "jeopardised": "jeopardized",
848
- "jeopardises": "jeopardizes",
849
- "jeopardising": "jeopardizing",
850
- "jewelled": "jeweled",
851
- "jeweller": "jeweler",
852
- "jewellers": "jewelers",
853
- "jewellery": "jewelry",
854
- "judgement": "judgment",
855
- "kilogramme": "kilogram",
856
- "kilogrammes": "kilograms",
857
- "kilometre": "kilometer",
858
- "kilometres": "kilometers",
859
- "labelled": "labeled",
860
- "labelling": "labeling",
861
- "labour": "labor",
862
- "laboured": "labored",
863
- "labourer": "laborer",
864
- "labourers": "laborers",
865
- "labouring": "laboring",
866
- "labours": "labors",
867
- "lacklustre": "lackluster",
868
- "legalisation": "legalization",
869
- "legalise": "legalize",
870
- "legalised": "legalized",
871
- "legalises": "legalizes",
872
- "legalising": "legalizing",
873
- "legitimise": "legitimize",
874
- "legitimised": "legitimized",
875
- "legitimises": "legitimizes",
876
- "legitimising": "legitimizing",
877
- "leukaemia": "leukemia",
878
- "levelled": "leveled",
879
- "leveller": "leveler",
880
- "levellers": "levelers",
881
- "levelling": "leveling",
882
- "libelled": "libeled",
883
- "libelling": "libeling",
884
- "libellous": "libelous",
885
- "liberalisation": "liberalization",
886
- "liberalise": "liberalize",
887
- "liberalised": "liberalized",
888
- "liberalises": "liberalizes",
889
- "liberalising": "liberalizing",
890
- "licence": "license",
891
- "licenced": "licensed",
892
- "licences": "licenses",
893
- "licencing": "licensing",
894
- "likeable": "likable",
895
- "lionisation": "lionization",
896
- "lionise": "lionize",
897
- "lionised": "lionized",
898
- "lionises": "lionizes",
899
- "lionising": "lionizing",
900
- "liquidise": "liquidize",
901
- "liquidised": "liquidized",
902
- "liquidiser": "liquidizer",
903
- "liquidisers": "liquidizers",
904
- "liquidises": "liquidizes",
905
- "liquidising": "liquidizing",
906
- "litre": "liter",
907
- "litres": "liters",
908
- "localise": "localize",
909
- "localised": "localized",
910
- "localises": "localizes",
911
- "localising": "localizing",
912
- "louvre": "louver",
913
- "louvred": "louvered",
914
- "louvres": "louvers",
915
- "lustre": "luster",
916
- "magnetise": "magnetize",
917
- "magnetised": "magnetized",
918
- "magnetises": "magnetizes",
919
- "magnetising": "magnetizing",
920
- "manoeuvrability": "maneuverability",
921
- "manoeuvrable": "maneuverable",
922
- "manoeuvre": "maneuver",
923
- "manoeuvred": "maneuvered",
924
- "manoeuvres": "maneuvers",
925
- "manoeuvring": "maneuvering",
926
- "manoeuvrings": "maneuverings",
927
- "marginalisation": "marginalization",
928
- "marginalise": "marginalize",
929
- "marginalised": "marginalized",
930
- "marginalises": "marginalizes",
931
- "marginalising": "marginalizing",
932
- "marshalled": "marshaled",
933
- "marshalling": "marshaling",
934
- "marvelled": "marveled",
935
- "marvelling": "marveling",
936
- "marvellous": "marvelous",
937
- "marvellously": "marvelously",
938
- "materialisation": "materialization",
939
- "materialise": "materialize",
940
- "materialised": "materialized",
941
- "materialises": "materializes",
942
- "materialising": "materializing",
943
- "maximisation": "maximization",
944
- "maximise": "maximize",
945
- "maximised": "maximized",
946
- "maximises": "maximizes",
947
- "maximising": "maximizing",
948
- "meagre": "meager",
949
- "mechanisation": "mechanization",
950
- "mechanise": "mechanize",
951
- "mechanised": "mechanized",
952
- "mechanises": "mechanizes",
953
- "mechanising": "mechanizing",
954
- "mediaeval": "medieval",
955
- "memorialise": "memorialize",
956
- "memorialised": "memorialized",
957
- "memorialises": "memorializes",
958
- "memorialising": "memorializing",
959
- "memorise": "memorize",
960
- "memorised": "memorized",
961
- "memorises": "memorizes",
962
- "memorising": "memorizing",
963
- "mesmerise": "mesmerize",
964
- "mesmerised": "mesmerized",
965
- "mesmerises": "mesmerizes",
966
- "mesmerising": "mesmerizing",
967
- "metabolise": "metabolize",
968
- "metabolised": "metabolized",
969
- "metabolises": "metabolizes",
970
- "metabolising": "metabolizing",
971
- "metre": "meter",
972
- "metres": "meters",
973
- "mhm": "hmm",
974
- "micrometre": "micrometer",
975
- "micrometres": "micrometers",
976
- "militarise": "militarize",
977
- "militarised": "militarized",
978
- "militarises": "militarizes",
979
- "militarising": "militarizing",
980
- "milligramme": "milligram",
981
- "milligrammes": "milligrams",
982
- "millilitre": "milliliter",
983
- "millilitres": "milliliters",
984
- "millimetre": "millimeter",
985
- "millimetres": "millimeters",
986
- "miniaturisation": "miniaturization",
987
- "miniaturise": "miniaturize",
988
- "miniaturised": "miniaturized",
989
- "miniaturises": "miniaturizes",
990
- "miniaturising": "miniaturizing",
991
- "minibusses": "minibuses",
992
- "minimise": "minimize",
993
- "minimised": "minimized",
994
- "minimises": "minimizes",
995
- "minimising": "minimizing",
996
- "misbehaviour": "misbehavior",
997
- "misdemeanour": "misdemeanor",
998
- "misdemeanours": "misdemeanors",
999
- "misspelt": "misspelled",
1000
- "mitre": "miter",
1001
- "mitres": "miters",
1002
- "mm": "hmm",
1003
- "mmm": "hmm",
1004
- "mobilisation": "mobilization",
1005
- "mobilise": "mobilize",
1006
- "mobilised": "mobilized",
1007
- "mobilises": "mobilizes",
1008
- "mobilising": "mobilizing",
1009
- "modelled": "modeled",
1010
- "modeller": "modeler",
1011
- "modellers": "modelers",
1012
- "modelling": "modeling",
1013
- "modernise": "modernize",
1014
- "modernised": "modernized",
1015
- "modernises": "modernizes",
1016
- "modernising": "modernizing",
1017
- "moisturise": "moisturize",
1018
- "moisturised": "moisturized",
1019
- "moisturiser": "moisturizer",
1020
- "moisturisers": "moisturizers",
1021
- "moisturises": "moisturizes",
1022
- "moisturising": "moisturizing",
1023
- "monologue": "monolog",
1024
- "monologues": "monologs",
1025
- "monopolisation": "monopolization",
1026
- "monopolise": "monopolize",
1027
- "monopolised": "monopolized",
1028
- "monopolises": "monopolizes",
1029
- "monopolising": "monopolizing",
1030
- "moralise": "moralize",
1031
- "moralised": "moralized",
1032
- "moralises": "moralizes",
1033
- "moralising": "moralizing",
1034
- "motorised": "motorized",
1035
- "mould": "mold",
1036
- "moulded": "molded",
1037
- "moulder": "molder",
1038
- "mouldered": "moldered",
1039
- "mouldering": "moldering",
1040
- "moulders": "molders",
1041
- "mouldier": "moldier",
1042
- "mouldiest": "moldiest",
1043
- "moulding": "molding",
1044
- "mouldings": "moldings",
1045
- "moulds": "molds",
1046
- "mouldy": "moldy",
1047
- "moult": "molt",
1048
- "moulted": "molted",
1049
- "moulting": "molting",
1050
- "moults": "molts",
1051
- "moustache": "mustache",
1052
- "moustached": "mustached",
1053
- "moustaches": "mustaches",
1054
- "moustachioed": "mustachioed",
1055
- "multicoloured": "multicolored",
1056
- "nationalisation": "nationalization",
1057
- "nationalisations": "nationalizations",
1058
- "nationalise": "nationalize",
1059
- "nationalised": "nationalized",
1060
- "nationalises": "nationalizes",
1061
- "nationalising": "nationalizing",
1062
- "naturalisation": "naturalization",
1063
- "naturalise": "naturalize",
1064
- "naturalised": "naturalized",
1065
- "naturalises": "naturalizes",
1066
- "naturalising": "naturalizing",
1067
- "neighbour": "neighbor",
1068
- "neighbourhood": "neighborhood",
1069
- "neighbourhoods": "neighborhoods",
1070
- "neighbouring": "neighboring",
1071
- "neighbourliness": "neighborliness",
1072
- "neighbourly": "neighborly",
1073
- "neighbours": "neighbors",
1074
- "neutralisation": "neutralization",
1075
- "neutralise": "neutralize",
1076
- "neutralised": "neutralized",
1077
- "neutralises": "neutralizes",
1078
- "neutralising": "neutralizing",
1079
- "normalisation": "normalization",
1080
- "normalise": "normalize",
1081
- "normalised": "normalized",
1082
- "normalises": "normalizes",
1083
- "normalising": "normalizing",
1084
- "odour": "odor",
1085
- "odourless": "odorless",
1086
- "odours": "odors",
1087
- "oesophagus": "esophagus",
1088
- "oesophaguses": "esophaguses",
1089
- "oestrogen": "estrogen",
1090
- "offence": "offense",
1091
- "offences": "offenses",
1092
- "omelette": "omelet",
1093
- "omelettes": "omelets",
1094
- "optimise": "optimize",
1095
- "optimised": "optimized",
1096
- "optimises": "optimizes",
1097
- "optimising": "optimizing",
1098
- "organisation": "organization",
1099
- "organisational": "organizational",
1100
- "organisations": "organizations",
1101
- "organise": "organize",
1102
- "organised": "organized",
1103
- "organiser": "organizer",
1104
- "organisers": "organizers",
1105
- "organises": "organizes",
1106
- "organising": "organizing",
1107
- "orthopaedic": "orthopedic",
1108
- "orthopaedics": "orthopedics",
1109
- "ostracise": "ostracize",
1110
- "ostracised": "ostracized",
1111
- "ostracises": "ostracizes",
1112
- "ostracising": "ostracizing",
1113
- "outmanoeuvre": "outmaneuver",
1114
- "outmanoeuvred": "outmaneuvered",
1115
- "outmanoeuvres": "outmaneuvers",
1116
- "outmanoeuvring": "outmaneuvering",
1117
- "overemphasise": "overemphasize",
1118
- "overemphasised": "overemphasized",
1119
- "overemphasises": "overemphasizes",
1120
- "overemphasising": "overemphasizing",
1121
- "oxidisation": "oxidization",
1122
- "oxidise": "oxidize",
1123
- "oxidised": "oxidized",
1124
- "oxidises": "oxidizes",
1125
- "oxidising": "oxidizing",
1126
- "paederast": "pederast",
1127
- "paederasts": "pederasts",
1128
- "paediatric": "pediatric",
1129
- "paediatrician": "pediatrician",
1130
- "paediatricians": "pediatricians",
1131
- "paediatrics": "pediatrics",
1132
- "paedophile": "pedophile",
1133
- "paedophiles": "pedophiles",
1134
- "paedophilia": "pedophilia",
1135
- "palaeolithic": "paleolithic",
1136
- "palaeontologist": "paleontologist",
1137
- "palaeontologists": "paleontologists",
1138
- "palaeontology": "paleontology",
1139
- "panelled": "paneled",
1140
- "panelling": "paneling",
1141
- "panellist": "panelist",
1142
- "panellists": "panelists",
1143
- "paralyse": "paralyze",
1144
- "paralysed": "paralyzed",
1145
- "paralyses": "paralyzes",
1146
- "paralysing": "paralyzing",
1147
- "parcelled": "parceled",
1148
- "parcelling": "parceling",
1149
- "parlour": "parlor",
1150
- "parlours": "parlors",
1151
- "particularise": "particularize",
1152
- "particularised": "particularized",
1153
- "particularises": "particularizes",
1154
- "particularising": "particularizing",
1155
- "passivisation": "passivization",
1156
- "passivise": "passivize",
1157
- "passivised": "passivized",
1158
- "passivises": "passivizes",
1159
- "passivising": "passivizing",
1160
- "pasteurisation": "pasteurization",
1161
- "pasteurise": "pasteurize",
1162
- "pasteurised": "pasteurized",
1163
- "pasteurises": "pasteurizes",
1164
- "pasteurising": "pasteurizing",
1165
- "patronise": "patronize",
1166
- "patronised": "patronized",
1167
- "patronises": "patronizes",
1168
- "patronising": "patronizing",
1169
- "patronisingly": "patronizingly",
1170
- "pedalled": "pedaled",
1171
- "pedalling": "pedaling",
1172
- "pedestrianisation": "pedestrianization",
1173
- "pedestrianise": "pedestrianize",
1174
- "pedestrianised": "pedestrianized",
1175
- "pedestrianises": "pedestrianizes",
1176
- "pedestrianising": "pedestrianizing",
1177
- "penalise": "penalize",
1178
- "penalised": "penalized",
1179
- "penalises": "penalizes",
1180
- "penalising": "penalizing",
1181
- "pencilled": "penciled",
1182
- "pencilling": "penciling",
1183
- "personalise": "personalize",
1184
- "personalised": "personalized",
1185
- "personalises": "personalizes",
1186
- "personalising": "personalizing",
1187
- "pharmacopoeia": "pharmacopeia",
1188
- "pharmacopoeias": "pharmacopeias",
1189
- "philosophise": "philosophize",
1190
- "philosophised": "philosophized",
1191
- "philosophises": "philosophizes",
1192
- "philosophising": "philosophizing",
1193
- "philtre": "filter",
1194
- "philtres": "filters",
1195
- "phoney": "phony",
1196
- "plagiarise": "plagiarize",
1197
- "plagiarised": "plagiarized",
1198
- "plagiarises": "plagiarizes",
1199
- "plagiarising": "plagiarizing",
1200
- "plough": "plow",
1201
- "ploughed": "plowed",
1202
- "ploughing": "plowing",
1203
- "ploughman": "plowman",
1204
- "ploughmen": "plowmen",
1205
- "ploughs": "plows",
1206
- "ploughshare": "plowshare",
1207
- "ploughshares": "plowshares",
1208
- "polarisation": "polarization",
1209
- "polarise": "polarize",
1210
- "polarised": "polarized",
1211
- "polarises": "polarizes",
1212
- "polarising": "polarizing",
1213
- "politicisation": "politicization",
1214
- "politicise": "politicize",
1215
- "politicised": "politicized",
1216
- "politicises": "politicizes",
1217
- "politicising": "politicizing",
1218
- "popularisation": "popularization",
1219
- "popularise": "popularize",
1220
- "popularised": "popularized",
1221
- "popularises": "popularizes",
1222
- "popularising": "popularizing",
1223
- "pouffe": "pouf",
1224
- "pouffes": "poufs",
1225
- "practise": "practice",
1226
- "practised": "practiced",
1227
- "practises": "practices",
1228
- "practising": "practicing",
1229
- "praesidium": "presidium",
1230
- "praesidiums": "presidiums",
1231
- "pressurisation": "pressurization",
1232
- "pressurise": "pressurize",
1233
- "pressurised": "pressurized",
1234
- "pressurises": "pressurizes",
1235
- "pressurising": "pressurizing",
1236
- "pretence": "pretense",
1237
- "pretences": "pretenses",
1238
- "primaeval": "primeval",
1239
- "prioritisation": "prioritization",
1240
- "prioritise": "prioritize",
1241
- "prioritised": "prioritized",
1242
- "prioritises": "prioritizes",
1243
- "prioritising": "prioritizing",
1244
- "privatisation": "privatization",
1245
- "privatisations": "privatizations",
1246
- "privatise": "privatize",
1247
- "privatised": "privatized",
1248
- "privatises": "privatizes",
1249
- "privatising": "privatizing",
1250
- "professionalisation": "professionalization",
1251
- "professionalise": "professionalize",
1252
- "professionalised": "professionalized",
1253
- "professionalises": "professionalizes",
1254
- "professionalising": "professionalizing",
1255
- "programme": "program",
1256
- "programmes": "programs",
1257
- "prologue": "prolog",
1258
- "prologues": "prologs",
1259
- "propagandise": "propagandize",
1260
- "propagandised": "propagandized",
1261
- "propagandises": "propagandizes",
1262
- "propagandising": "propagandizing",
1263
- "proselytise": "proselytize",
1264
- "proselytised": "proselytized",
1265
- "proselytiser": "proselytizer",
1266
- "proselytisers": "proselytizers",
1267
- "proselytises": "proselytizes",
1268
- "proselytising": "proselytizing",
1269
- "psychoanalyse": "psychoanalyze",
1270
- "psychoanalysed": "psychoanalyzed",
1271
- "psychoanalyses": "psychoanalyzes",
1272
- "psychoanalysing": "psychoanalyzing",
1273
- "publicise": "publicize",
1274
- "publicised": "publicized",
1275
- "publicises": "publicizes",
1276
- "publicising": "publicizing",
1277
- "pulverisation": "pulverization",
1278
- "pulverise": "pulverize",
1279
- "pulverised": "pulverized",
1280
- "pulverises": "pulverizes",
1281
- "pulverising": "pulverizing",
1282
- "pummelled": "pummel",
1283
- "pummelling": "pummeled",
1284
- "pyjama": "pajama",
1285
- "pyjamas": "pajamas",
1286
- "pzazz": "pizzazz",
1287
- "quarrelled": "quarreled",
1288
- "quarrelling": "quarreling",
1289
- "radicalise": "radicalize",
1290
- "radicalised": "radicalized",
1291
- "radicalises": "radicalizes",
1292
- "radicalising": "radicalizing",
1293
- "rancour": "rancor",
1294
- "randomise": "randomize",
1295
- "randomised": "randomized",
1296
- "randomises": "randomizes",
1297
- "randomising": "randomizing",
1298
- "rationalisation": "rationalization",
1299
- "rationalisations": "rationalizations",
1300
- "rationalise": "rationalize",
1301
- "rationalised": "rationalized",
1302
- "rationalises": "rationalizes",
1303
- "rationalising": "rationalizing",
1304
- "ravelled": "raveled",
1305
- "ravelling": "raveling",
1306
- "realisable": "realizable",
1307
- "realisation": "realization",
1308
- "realisations": "realizations",
1309
- "realise": "realize",
1310
- "realised": "realized",
1311
- "realises": "realizes",
1312
- "realising": "realizing",
1313
- "recognisable": "recognizable",
1314
- "recognisably": "recognizably",
1315
- "recognisance": "recognizance",
1316
- "recognise": "recognize",
1317
- "recognised": "recognized",
1318
- "recognises": "recognizes",
1319
- "recognising": "recognizing",
1320
- "reconnoitre": "reconnoiter",
1321
- "reconnoitred": "reconnoitered",
1322
- "reconnoitres": "reconnoiters",
1323
- "reconnoitring": "reconnoitering",
1324
- "refuelled": "refueled",
1325
- "refuelling": "refueling",
1326
- "regularisation": "regularization",
1327
- "regularise": "regularize",
1328
- "regularised": "regularized",
1329
- "regularises": "regularizes",
1330
- "regularising": "regularizing",
1331
- "remodelled": "remodeled",
1332
- "remodelling": "remodeling",
1333
- "remould": "remold",
1334
- "remoulded": "remolded",
1335
- "remoulding": "remolding",
1336
- "remoulds": "remolds",
1337
- "reorganisation": "reorganization",
1338
- "reorganisations": "reorganizations",
1339
- "reorganise": "reorganize",
1340
- "reorganised": "reorganized",
1341
- "reorganises": "reorganizes",
1342
- "reorganising": "reorganizing",
1343
- "revelled": "reveled",
1344
- "reveller": "reveler",
1345
- "revellers": "revelers",
1346
- "revelling": "reveling",
1347
- "revitalise": "revitalize",
1348
- "revitalised": "revitalized",
1349
- "revitalises": "revitalizes",
1350
- "revitalising": "revitalizing",
1351
- "revolutionise": "revolutionize",
1352
- "revolutionised": "revolutionized",
1353
- "revolutionises": "revolutionizes",
1354
- "revolutionising": "revolutionizing",
1355
- "rhapsodise": "rhapsodize",
1356
- "rhapsodised": "rhapsodized",
1357
- "rhapsodises": "rhapsodizes",
1358
- "rhapsodising": "rhapsodizing",
1359
- "rigour": "rigor",
1360
- "rigours": "rigors",
1361
- "ritualised": "ritualized",
1362
- "rivalled": "rivaled",
1363
- "rivalling": "rivaling",
1364
- "romanticise": "romanticize",
1365
- "romanticised": "romanticized",
1366
- "romanticises": "romanticizes",
1367
- "romanticising": "romanticizing",
1368
- "rumour": "rumor",
1369
- "rumoured": "rumored",
1370
- "rumours": "rumors",
1371
- "sabre": "saber",
1372
- "sabres": "sabers",
1373
- "saltpetre": "saltpeter",
1374
- "sanitise": "sanitize",
1375
- "sanitised": "sanitized",
1376
- "sanitises": "sanitizes",
1377
- "sanitising": "sanitizing",
1378
- "satirise": "satirize",
1379
- "satirised": "satirized",
1380
- "satirises": "satirizes",
1381
- "satirising": "satirizing",
1382
- "saviour": "savior",
1383
- "saviours": "saviors",
1384
- "savour": "savor",
1385
- "savoured": "savored",
1386
- "savouries": "savories",
1387
- "savouring": "savoring",
1388
- "savours": "savors",
1389
- "savoury": "savory",
1390
- "scandalise": "scandalize",
1391
- "scandalised": "scandalized",
1392
- "scandalises": "scandalizes",
1393
- "scandalising": "scandalizing",
1394
- "sceptic": "skeptic",
1395
- "sceptical": "skeptical",
1396
- "sceptically": "skeptically",
1397
- "scepticism": "skepticism",
1398
- "sceptics": "skeptics",
1399
- "sceptre": "scepter",
1400
- "sceptres": "scepters",
1401
- "scrutinise": "scrutinize",
1402
- "scrutinised": "scrutinized",
1403
- "scrutinises": "scrutinizes",
1404
- "scrutinising": "scrutinizing",
1405
- "secularisation": "secularization",
1406
- "secularise": "secularize",
1407
- "secularised": "secularized",
1408
- "secularises": "secularizes",
1409
- "secularising": "secularizing",
1410
- "sensationalise": "sensationalize",
1411
- "sensationalised": "sensationalized",
1412
- "sensationalises": "sensationalizes",
1413
- "sensationalising": "sensationalizing",
1414
- "sensitise": "sensitize",
1415
- "sensitised": "sensitized",
1416
- "sensitises": "sensitizes",
1417
- "sensitising": "sensitizing",
1418
- "sentimentalise": "sentimentalize",
1419
- "sentimentalised": "sentimentalized",
1420
- "sentimentalises": "sentimentalizes",
1421
- "sentimentalising": "sentimentalizing",
1422
- "sepulchre": "sepulcher",
1423
- "sepulchres": "sepulchers",
1424
- "serialisation": "serialization",
1425
- "serialisations": "serializations",
1426
- "serialise": "serialize",
1427
- "serialised": "serialized",
1428
- "serialises": "serializes",
1429
- "serialising": "serializing",
1430
- "sermonise": "sermonize",
1431
- "sermonised": "sermonized",
1432
- "sermonises": "sermonizes",
1433
- "sermonising": "sermonizing",
1434
- "sheikh": "sheik",
1435
- "shovelled": "shoveled",
1436
- "shovelling": "shoveling",
1437
- "shrivelled": "shriveled",
1438
- "shrivelling": "shriveling",
1439
- "signalise": "signalize",
1440
- "signalised": "signalized",
1441
- "signalises": "signalizes",
1442
- "signalising": "signalizing",
1443
- "signalled": "signaled",
1444
- "signalling": "signaling",
1445
- "smoulder": "smolder",
1446
- "smouldered": "smoldered",
1447
- "smouldering": "smoldering",
1448
- "smoulders": "smolders",
1449
- "snivelled": "sniveled",
1450
- "snivelling": "sniveling",
1451
- "snorkelled": "snorkeled",
1452
- "snorkelling": "snorkeling",
1453
- "snowplough": "snowplow",
1454
- "snowploughs": "snowplow",
1455
- "socialisation": "socialization",
1456
- "socialise": "socialize",
1457
- "socialised": "socialized",
1458
- "socialises": "socializes",
1459
- "socialising": "socializing",
1460
- "sodomise": "sodomize",
1461
- "sodomised": "sodomized",
1462
- "sodomises": "sodomizes",
1463
- "sodomising": "sodomizing",
1464
- "solemnise": "solemnize",
1465
- "solemnised": "solemnized",
1466
- "solemnises": "solemnizes",
1467
- "solemnising": "solemnizing",
1468
- "sombre": "somber",
1469
- "specialisation": "specialization",
1470
- "specialisations": "specializations",
1471
- "specialise": "specialize",
1472
- "specialised": "specialized",
1473
- "specialises": "specializes",
1474
- "specialising": "specializing",
1475
- "spectre": "specter",
1476
- "spectres": "specters",
1477
- "spiralled": "spiraled",
1478
- "spiralling": "spiraling",
1479
- "splendour": "splendor",
1480
- "splendours": "splendors",
1481
- "squirrelled": "squirreled",
1482
- "squirrelling": "squirreling",
1483
- "stabilisation": "stabilization",
1484
- "stabilise": "stabilize",
1485
- "stabilised": "stabilized",
1486
- "stabiliser": "stabilizer",
1487
- "stabilisers": "stabilizers",
1488
- "stabilises": "stabilizes",
1489
- "stabilising": "stabilizing",
1490
- "standardisation": "standardization",
1491
- "standardise": "standardize",
1492
- "standardised": "standardized",
1493
- "standardises": "standardizes",
1494
- "standardising": "standardizing",
1495
- "stencilled": "stenciled",
1496
- "stencilling": "stenciling",
1497
- "sterilisation": "sterilization",
1498
- "sterilisations": "sterilizations",
1499
- "sterilise": "sterilize",
1500
- "sterilised": "sterilized",
1501
- "steriliser": "sterilizer",
1502
- "sterilisers": "sterilizers",
1503
- "sterilises": "sterilizes",
1504
- "sterilising": "sterilizing",
1505
- "stigmatisation": "stigmatization",
1506
- "stigmatise": "stigmatize",
1507
- "stigmatised": "stigmatized",
1508
- "stigmatises": "stigmatizes",
1509
- "stigmatising": "stigmatizing",
1510
- "storey": "story",
1511
- "storeys": "stories",
1512
- "subsidisation": "subsidization",
1513
- "subsidise": "subsidize",
1514
- "subsidised": "subsidized",
1515
- "subsidiser": "subsidizer",
1516
- "subsidisers": "subsidizers",
1517
- "subsidises": "subsidizes",
1518
- "subsidising": "subsidizing",
1519
- "succour": "succor",
1520
- "succoured": "succored",
1521
- "succouring": "succoring",
1522
- "succours": "succors",
1523
- "sulphate": "sulfate",
1524
- "sulphates": "sulfates",
1525
- "sulphide": "sulfide",
1526
- "sulphides": "sulfides",
1527
- "sulphur": "sulfur",
1528
- "sulphurous": "sulfurous",
1529
- "summarise": "summarize",
1530
- "summarised": "summarized",
1531
- "summarises": "summarizes",
1532
- "summarising": "summarizing",
1533
- "swivelled": "swiveled",
1534
- "swivelling": "swiveling",
1535
- "symbolise": "symbolize",
1536
- "symbolised": "symbolized",
1537
- "symbolises": "symbolizes",
1538
- "symbolising": "symbolizing",
1539
- "sympathise": "sympathize",
1540
- "sympathised": "sympathized",
1541
- "sympathiser": "sympathizer",
1542
- "sympathisers": "sympathizers",
1543
- "sympathises": "sympathizes",
1544
- "sympathising": "sympathizing",
1545
- "synchronisation": "synchronization",
1546
- "synchronise": "synchronize",
1547
- "synchronised": "synchronized",
1548
- "synchronises": "synchronizes",
1549
- "synchronising": "synchronizing",
1550
- "synthesise": "synthesize",
1551
- "synthesised": "synthesized",
1552
- "synthesiser": "synthesizer",
1553
- "synthesisers": "synthesizers",
1554
- "synthesises": "synthesizes",
1555
- "synthesising": "synthesizing",
1556
- "syphon": "siphon",
1557
- "syphoned": "siphoned",
1558
- "syphoning": "siphoning",
1559
- "syphons": "siphons",
1560
- "systematisation": "systematization",
1561
- "systematise": "systematize",
1562
- "systematised": "systematized",
1563
- "systematises": "systematizes",
1564
- "systematising": "systematizing",
1565
- "tantalise": "tantalize",
1566
- "tantalised": "tantalized",
1567
- "tantalises": "tantalizes",
1568
- "tantalising": "tantalizing",
1569
- "tantalisingly": "tantalizingly",
1570
- "tasselled": "tasseled",
1571
- "technicolour": "technicolor",
1572
- "temporise": "temporize",
1573
- "temporised": "temporized",
1574
- "temporises": "temporizes",
1575
- "temporising": "temporizing",
1576
- "tenderise": "tenderize",
1577
- "tenderised": "tenderized",
1578
- "tenderises": "tenderizes",
1579
- "tenderising": "tenderizing",
1580
- "terrorise": "terrorize",
1581
- "terrorised": "terrorized",
1582
- "terrorises": "terrorizes",
1583
- "terrorising": "terrorizing",
1584
- "theatre": "theater",
1585
- "theatregoer": "theatergoer",
1586
- "theatregoers": "theatergoers",
1587
- "theatres": "theaters",
1588
- "theorise": "theorize",
1589
- "theorised": "theorized",
1590
- "theorises": "theorizes",
1591
- "theorising": "theorizing",
1592
- "tonne": "ton",
1593
- "tonnes": "tons",
1594
- "towelled": "toweled",
1595
- "towelling": "toweling",
1596
- "toxaemia": "toxemia",
1597
- "tranquillise": "tranquilize",
1598
- "tranquillised": "tranquilized",
1599
- "tranquilliser": "tranquilizer",
1600
- "tranquillisers": "tranquilizers",
1601
- "tranquillises": "tranquilizes",
1602
- "tranquillising": "tranquilizing",
1603
- "tranquillity": "tranquility",
1604
- "tranquillize": "tranquilize",
1605
- "tranquillized": "tranquilized",
1606
- "tranquillizer": "tranquilizer",
1607
- "tranquillizers": "tranquilizers",
1608
- "tranquillizes": "tranquilizes",
1609
- "tranquillizing": "tranquilizing",
1610
- "tranquilly": "tranquility",
1611
- "transistorised": "transistorized",
1612
- "traumatise": "traumatize",
1613
- "traumatised": "traumatized",
1614
- "traumatises": "traumatizes",
1615
- "traumatising": "traumatizing",
1616
- "travelled": "traveled",
1617
- "traveller": "traveler",
1618
- "travellers": "travelers",
1619
- "travelling": "traveling",
1620
- "travelog": "travelogue",
1621
- "travelogs": "travelogues",
1622
- "trialled": "trialed",
1623
- "trialling": "trialing",
1624
- "tricolour": "tricolor",
1625
- "tricolours": "tricolors",
1626
- "trivialise": "trivialize",
1627
- "trivialised": "trivialized",
1628
- "trivialises": "trivializes",
1629
- "trivialising": "trivializing",
1630
- "tumour": "tumor",
1631
- "tumours": "tumors",
1632
- "tunnelled": "tunneled",
1633
- "tunnelling": "tunneling",
1634
- "tyrannise": "tyrannize",
1635
- "tyrannised": "tyrannized",
1636
- "tyrannises": "tyrannizes",
1637
- "tyrannising": "tyrannizing",
1638
- "tyre": "tire",
1639
- "tyres": "tires",
1640
- "unauthorised": "unauthorized",
1641
- "uncivilised": "uncivilized",
1642
- "underutilised": "underutilized",
1643
- "unequalled": "unequaled",
1644
- "unfavourable": "unfavorable",
1645
- "unfavourably": "unfavorably",
1646
- "unionisation": "unionization",
1647
- "unionise": "unionize",
1648
- "unionised": "unionized",
1649
- "unionises": "unionizes",
1650
- "unionising": "unionizing",
1651
- "unorganised": "unorganized",
1652
- "unravelled": "unraveled",
1653
- "unravelling": "unraveling",
1654
- "unrecognisable": "unrecognizable",
1655
- "unrecognised": "unrecognized",
1656
- "unrivalled": "unrivaled",
1657
- "unsavoury": "unsavory",
1658
- "untrammelled": "untrammeled",
1659
- "urbanisation": "urbanization",
1660
- "urbanise": "urbanize",
1661
- "urbanised": "urbanized",
1662
- "urbanises": "urbanizes",
1663
- "urbanising": "urbanizing",
1664
- "utilisable": "utilizable",
1665
- "utilisation": "utilization",
1666
- "utilise": "utilize",
1667
- "utilised": "utilized",
1668
- "utilises": "utilizes",
1669
- "utilising": "utilizing",
1670
- "valour": "valor",
1671
- "vandalise": "vandalize",
1672
- "vandalised": "vandalized",
1673
- "vandalises": "vandalizes",
1674
- "vandalising": "vandalizing",
1675
- "vaporisation": "vaporization",
1676
- "vaporise": "vaporize",
1677
- "vaporised": "vaporized",
1678
- "vaporises": "vaporizes",
1679
- "vaporising": "vaporizing",
1680
- "vapour": "vapor",
1681
- "vapours": "vapors",
1682
- "verbalise": "verbalize",
1683
- "verbalised": "verbalized",
1684
- "verbalises": "verbalizes",
1685
- "verbalising": "verbalizing",
1686
- "victimisation": "victimization",
1687
- "victimise": "victimize",
1688
- "victimised": "victimized",
1689
- "victimises": "victimizes",
1690
- "victimising": "victimizing",
1691
- "videodisc": "videodisk",
1692
- "videodiscs": "videodisks",
1693
- "vigour": "vigor",
1694
- "visualisation": "visualization",
1695
- "visualisations": "visualizations",
1696
- "visualise": "visualize",
1697
- "visualised": "visualized",
1698
- "visualises": "visualizes",
1699
- "visualising": "visualizing",
1700
- "vocalisation": "vocalization",
1701
- "vocalisations": "vocalizations",
1702
- "vocalise": "vocalize",
1703
- "vocalised": "vocalized",
1704
- "vocalises": "vocalizes",
1705
- "vocalising": "vocalizing",
1706
- "vulcanised": "vulcanized",
1707
- "vulgarisation": "vulgarization",
1708
- "vulgarise": "vulgarize",
1709
- "vulgarised": "vulgarized",
1710
- "vulgarises": "vulgarizes",
1711
- "vulgarising": "vulgarizing",
1712
- "waggon": "wagon",
1713
- "waggons": "wagons",
1714
- "watercolour": "watercolor",
1715
- "watercolours": "watercolors",
1716
- "weaselled": "weaseled",
1717
- "weaselling": "weaseling",
1718
- "westernisation": "westernization",
1719
- "westernise": "westernize",
1720
- "westernised": "westernized",
1721
- "westernises": "westernizes",
1722
- "westernising": "westernizing",
1723
- "womanise": "womanize",
1724
- "womanised": "womanized",
1725
- "womaniser": "womanizer",
1726
- "womanisers": "womanizers",
1727
- "womanises": "womanizes",
1728
- "womanising": "womanizing",
1729
- "woollen": "woolen",
1730
- "woollens": "woolens",
1731
- "woollies": "woolies",
1732
- "woolly": "wooly",
1733
- "worshipped": "worshiped",
1734
- "worshipper": "worshiper",
1735
- "worshipping": "worshiping",
1736
- "yodelled": "yodeled",
1737
- "yodelling": "yodeling",
1738
- "yoghourt": "yogurt",
1739
- "yoghourts": "yogurts",
1740
- "yoghurt": "yogurt",
1741
- "yoghurts": "yogurts"
1742
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8b7db43722c09d7b27c717393cd01d6cbbb0a0bfed84454c6a435e84f2c91e3
3
  size 967102601
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70a0558d32f090315b932d793e742d46101a6286e87e680c5fecb4a2c0ed862e
3
  size 967102601
runs/May15_12-08-38_DESKTOP-OD7C1Q6/1684130924.7925029/events.out.tfevents.1684130924.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe9bb07ee7147ed13370775248e8175483467d394f172e9df238681872eb6fdb
3
- size 5703
 
 
 
 
runs/May15_12-08-38_DESKTOP-OD7C1Q6/events.out.tfevents.1684130924.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:71fd799105968dd35d677c29854f23281e86af2c6d3f7bbed8c24da422c9f048
3
- size 4653
 
 
 
 
runs/May15_12-15-25_DESKTOP-OD7C1Q6/1684131331.9202273/events.out.tfevents.1684131331.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:995a70cbd10c9b915a4f03748e27c73a22c77ffd02c4f73e76d933de2d638600
3
- size 5703
 
 
 
 
runs/May15_12-15-25_DESKTOP-OD7C1Q6/events.out.tfevents.1684131331.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9591d48d0b369e45899d52da758713c70d27066f1fe17d2dc1734ab6622567a4
3
- size 4653
 
 
 
 
runs/May15_13-19-50_DESKTOP-OD7C1Q6/1684135196.836124/events.out.tfevents.1684135196.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d6332a943560b994b9e1c5e6fea83e2dbdfbfc566ec1f3c3487dbad891fc685
3
- size 5703
 
 
 
 
runs/May15_13-19-50_DESKTOP-OD7C1Q6/events.out.tfevents.1684135196.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe27f44c89226fe5ca8a0f988fc02e971cca6d52aab2909f258876b025018a19
3
- size 4653
 
 
 
 
runs/May15_13-32-25_DESKTOP-OD7C1Q6/1684135953.274833/events.out.tfevents.1684135953.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9922d8fc99c889753ff3f067c78ba4d3a11a47b9f3daecdce75d8ed0a78066e
3
- size 5703
 
 
 
 
runs/May15_13-32-25_DESKTOP-OD7C1Q6/events.out.tfevents.1684135953.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:95377feb15e59e0a2f1d3ab8f81cbc31e0a49d1f3012e6d07681da11dc886a0b
3
- size 4653
 
 
 
 
runs/May15_14-04-02_DESKTOP-OD7C1Q6/1684137848.1832855/events.out.tfevents.1684137848.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:213d087e3fb61f154c8694c09d30bad5bc3109226fa1d9e566507382d0ae45ac
3
- size 5703
 
 
 
 
runs/May15_14-04-02_DESKTOP-OD7C1Q6/events.out.tfevents.1684137848.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7758c998ec59f03b698b9a3b2ff1658d99c5ad33b25f4b80a6812c8704330234
3
- size 4653
 
 
 
 
runs/May15_14-48-43_DESKTOP-OD7C1Q6/1684140528.8114798/events.out.tfevents.1684140528.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:90a6ecc9f4a4c81927451d61f7496b6ec064be68188e9a7cb73f32db8a39d440
3
- size 5703
 
 
 
 
runs/May15_14-48-43_DESKTOP-OD7C1Q6/events.out.tfevents.1684140528.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b4846721872455fd2d2ff248594f373c2fcbb7033960a086c99d64ca397b51e
3
- size 4651
 
 
 
 
runs/May15_14-59-56_DESKTOP-OD7C1Q6/1684141202.0174327/events.out.tfevents.1684141202.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:af86acda2ac7b5492bc1b3dfc2156f198c0bedf8169be3a02e4c522d93967cc0
3
- size 5703
 
 
 
 
runs/May15_14-59-56_DESKTOP-OD7C1Q6/events.out.tfevents.1684141202.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:11bcb7ce9661734f1b0632c3bced8caceffa4bc12d7e2bcda30ba9676a9e1579
3
- size 4651
 
 
 
 
runs/May15_15-12-20_DESKTOP-OD7C1Q6/1684141947.2878134/events.out.tfevents.1684141947.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbc6a7bb119f6716a0f6973d4581c27d654a865cbb15222f5e8c7aec7dbc3219
3
- size 5703
 
 
 
 
runs/May15_15-12-20_DESKTOP-OD7C1Q6/events.out.tfevents.1684141947.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:895a151daf82bdf531cbe4831fcf8d893b9d259cd6e658799427af55a66543a0
3
- size 4651
 
 
 
 
runs/May15_15-29-19_DESKTOP-OD7C1Q6/1684142964.8228638/events.out.tfevents.1684142964.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b32d2bb64351a9127b77d7aa942ea6ebad69ebfedf460670004aad6b50f5c4f
3
- size 5703
 
 
 
 
runs/May15_15-29-19_DESKTOP-OD7C1Q6/events.out.tfevents.1684142964.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:878bc7a54e38676db288d52bc9e371752ce156e84aeb59c75ba2d4849aac0d51
3
- size 4652
 
 
 
 
runs/May15_15-47-11_DESKTOP-OD7C1Q6/1684144037.0687504/events.out.tfevents.1684144037.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:047eac77f0811a1700aa302de08a6039dbef0aebe4ce56344ead0062a466104e
3
- size 5703
 
 
 
 
runs/May15_15-47-11_DESKTOP-OD7C1Q6/events.out.tfevents.1684144037.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d450b8be43c3c9af390685b9f4c2c389f884b6d76e24b074f75f69fb6aafd00
3
- size 5305
 
 
 
 
runs/May15_15-47-11_DESKTOP-OD7C1Q6/events.out.tfevents.1684144731.DESKTOP-OD7C1Q6 DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:2aef58d48fc6abdae3c1509a074d50455a62a6510ae62a0eb8365f93862817d7
3
- size 40
 
 
 
 
runs/{May13_23-09-22_DESKTOP-OD7C1Q6/1683997770.2403045/events.out.tfevents.1683997770.DESKTOP-OD7C1Q6 → May15_16-55-04_DESKTOP-OD7C1Q6/1684148109.9478214/events.out.tfevents.1684148109.DESKTOP-OD7C1Q6} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4b1ab019a8e871e28c10a48cdb1416e162572c30d2af32033600a2fc2991bfa
3
- size 5703
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbd2d3c6d2a78470ee2e09b7e00686e640c9a5c821bf5ef7d2efd7a1053cad75
3
+ size 5841
runs/{May13_23-09-22_DESKTOP-OD7C1Q6/events.out.tfevents.1683997770.DESKTOP-OD7C1Q6 → May15_16-55-04_DESKTOP-OD7C1Q6/events.out.tfevents.1684148109.DESKTOP-OD7C1Q6} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:606040c60ee7708fa1dbad905eca79a7cc664c90dbdcffcd12bad8348a09e774
3
- size 4652
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b36951b2c94b6cd36f420649b1cadfd923728f2888493bb08e5496b19de6884a
3
+ size 8016
runs/{May15_11-17-07_DESKTOP-OD7C1Q6/1684127833.5408869/events.out.tfevents.1684127833.DESKTOP-OD7C1Q6 → May15_22-40-19_DESKTOP-OD7C1Q6/1684168824.9625106/events.out.tfevents.1684168824.DESKTOP-OD7C1Q6} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:189723d8061b53912805ea4ef9844b48e639b30b44e3f8c96cd157052005777b
3
- size 5703
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7175c9a71b9fc363128a8e188589c9821513a6e490763e38556788f9be25b0e8
3
+ size 5841
runs/{May15_11-17-07_DESKTOP-OD7C1Q6/events.out.tfevents.1684127833.DESKTOP-OD7C1Q6 → May15_22-40-19_DESKTOP-OD7C1Q6/events.out.tfevents.1684168824.DESKTOP-OD7C1Q6} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59d8ce96f93a61adef1f60c1ab18d0b1e82e4a5f31ceec9900c5d914b68de370
3
- size 4653
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfa01668cd97f52fc93b6bfed9c83a78013bc282e264501ef890a1d36706eb00
3
+ size 11364
special_tokens_map.json DELETED
@@ -1,133 +0,0 @@
1
- {
2
- "additional_special_tokens": [
3
- "<|endoftext|>",
4
- "<|startoftranscript|>",
5
- "<|en|>",
6
- "<|zh|>",
7
- "<|de|>",
8
- "<|es|>",
9
- "<|ru|>",
10
- "<|ko|>",
11
- "<|fr|>",
12
- "<|ja|>",
13
- "<|pt|>",
14
- "<|tr|>",
15
- "<|pl|>",
16
- "<|ca|>",
17
- "<|nl|>",
18
- "<|ar|>",
19
- "<|sv|>",
20
- "<|it|>",
21
- "<|id|>",
22
- "<|hi|>",
23
- "<|fi|>",
24
- "<|vi|>",
25
- "<|he|>",
26
- "<|uk|>",
27
- "<|el|>",
28
- "<|ms|>",
29
- "<|cs|>",
30
- "<|ro|>",
31
- "<|da|>",
32
- "<|hu|>",
33
- "<|ta|>",
34
- "<|no|>",
35
- "<|th|>",
36
- "<|ur|>",
37
- "<|hr|>",
38
- "<|bg|>",
39
- "<|lt|>",
40
- "<|la|>",
41
- "<|mi|>",
42
- "<|ml|>",
43
- "<|cy|>",
44
- "<|sk|>",
45
- "<|te|>",
46
- "<|fa|>",
47
- "<|lv|>",
48
- "<|bn|>",
49
- "<|sr|>",
50
- "<|az|>",
51
- "<|sl|>",
52
- "<|kn|>",
53
- "<|et|>",
54
- "<|mk|>",
55
- "<|br|>",
56
- "<|eu|>",
57
- "<|is|>",
58
- "<|hy|>",
59
- "<|ne|>",
60
- "<|mn|>",
61
- "<|bs|>",
62
- "<|kk|>",
63
- "<|sq|>",
64
- "<|sw|>",
65
- "<|gl|>",
66
- "<|mr|>",
67
- "<|pa|>",
68
- "<|si|>",
69
- "<|km|>",
70
- "<|sn|>",
71
- "<|yo|>",
72
- "<|so|>",
73
- "<|af|>",
74
- "<|oc|>",
75
- "<|ka|>",
76
- "<|be|>",
77
- "<|tg|>",
78
- "<|sd|>",
79
- "<|gu|>",
80
- "<|am|>",
81
- "<|yi|>",
82
- "<|lo|>",
83
- "<|uz|>",
84
- "<|fo|>",
85
- "<|ht|>",
86
- "<|ps|>",
87
- "<|tk|>",
88
- "<|nn|>",
89
- "<|mt|>",
90
- "<|sa|>",
91
- "<|lb|>",
92
- "<|my|>",
93
- "<|bo|>",
94
- "<|tl|>",
95
- "<|mg|>",
96
- "<|as|>",
97
- "<|tt|>",
98
- "<|haw|>",
99
- "<|ln|>",
100
- "<|ha|>",
101
- "<|ba|>",
102
- "<|jw|>",
103
- "<|su|>",
104
- "<|translate|>",
105
- "<|transcribe|>",
106
- "<|startoflm|>",
107
- "<|startofprev|>",
108
- "<|nocaptions|>",
109
- "<|notimestamps|>"
110
- ],
111
- "bos_token": {
112
- "content": "<|endoftext|>",
113
- "lstrip": false,
114
- "normalized": true,
115
- "rstrip": false,
116
- "single_word": false
117
- },
118
- "eos_token": {
119
- "content": "<|endoftext|>",
120
- "lstrip": false,
121
- "normalized": true,
122
- "rstrip": false,
123
- "single_word": false
124
- },
125
- "pad_token": "<|endoftext|>",
126
- "unk_token": {
127
- "content": "<|endoftext|>",
128
- "lstrip": false,
129
- "normalized": true,
130
- "rstrip": false,
131
- "single_word": false
132
- }
133
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer_config.json DELETED
@@ -1,35 +0,0 @@
1
- {
2
- "add_bos_token": false,
3
- "add_prefix_space": false,
4
- "bos_token": {
5
- "__type": "AddedToken",
6
- "content": "<|endoftext|>",
7
- "lstrip": false,
8
- "normalized": true,
9
- "rstrip": false,
10
- "single_word": false
11
- },
12
- "eos_token": {
13
- "__type": "AddedToken",
14
- "content": "<|endoftext|>",
15
- "lstrip": false,
16
- "normalized": true,
17
- "rstrip": false,
18
- "single_word": false
19
- },
20
- "errors": "replace",
21
- "model_max_length": 1024,
22
- "pad_token": null,
23
- "processor_class": "WhisperProcessor",
24
- "return_attention_mask": false,
25
- "special_tokens_map_file": null,
26
- "tokenizer_class": "WhisperTokenizer",
27
- "unk_token": {
28
- "__type": "AddedToken",
29
- "content": "<|endoftext|>",
30
- "lstrip": false,
31
- "normalized": true,
32
- "rstrip": false,
33
- "single_word": false
34
- }
35
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
train_results.json DELETED
@@ -1,7 +0,0 @@
1
- {
2
- "epoch": 1.31,
3
- "train_loss": 2.721541290283203,
4
- "train_runtime": 665.7853,
5
- "train_samples_per_second": 4.806,
6
- "train_steps_per_second": 0.075
7
- }
 
 
 
 
 
 
 
 
trainer_state.json DELETED
@@ -1,37 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 1.3114754098360657,
5
- "global_step": 50,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.66,
12
- "learning_rate": 2.5000000000000004e-07,
13
- "loss": 2.792,
14
- "step": 25
15
- },
16
- {
17
- "epoch": 1.31,
18
- "learning_rate": 5.000000000000001e-07,
19
- "loss": 2.651,
20
- "step": 50
21
- },
22
- {
23
- "epoch": 1.31,
24
- "step": 50,
25
- "total_flos": 9.2289611022336e+17,
26
- "train_loss": 2.721541290283203,
27
- "train_runtime": 665.7853,
28
- "train_samples_per_second": 4.806,
29
- "train_steps_per_second": 0.075
30
- }
31
- ],
32
- "max_steps": 50,
33
- "num_train_epochs": 2,
34
- "total_flos": 9.2289611022336e+17,
35
- "trial_name": null,
36
- "trial_params": null
37
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08f2b349d8fb07d165078798d56f36a2b9658e4125b02c036200330e9feede40
3
- size 3643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6927498f6d9e476fef21df4100ff020985091bef32f4658d85097f9b619e9cf
3
+ size 4027