jraramhoej commited on
Commit
36a641a
1 Parent(s): af1bbb4

Training in progress, step 1000

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "openai/whisper-small",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
 
1
  {
2
+ "_name_or_path": "checkpoint-2000",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
fine-tune-whisper-streaming.ipynb CHANGED
@@ -154,71 +154,14 @@
154
  "execution_count": 2,
155
  "id": "a2787582-554f-44ce-9f38-4180a5ed6b44",
156
  "metadata": {},
157
- "outputs": [
158
- {
159
- "data": {
160
- "application/vnd.jupyter.widget-view+json": {
161
- "model_id": "a5bfb5c5097d427e97faf28bc5c3aa8a",
162
- "version_major": 2,
163
- "version_minor": 0
164
- },
165
- "text/plain": [
166
- "Downloading builder script: 0%| | 0.00/8.30k [00:00<?, ?B/s]"
167
- ]
168
- },
169
- "metadata": {},
170
- "output_type": "display_data"
171
- },
172
- {
173
- "data": {
174
- "application/vnd.jupyter.widget-view+json": {
175
- "model_id": "86fc1ce2e457497ea0d838ee2221bce4",
176
- "version_major": 2,
177
- "version_minor": 0
178
- },
179
- "text/plain": [
180
- "Downloading readme: 0%| | 0.00/12.2k [00:00<?, ?B/s]"
181
- ]
182
- },
183
- "metadata": {},
184
- "output_type": "display_data"
185
- },
186
- {
187
- "data": {
188
- "application/vnd.jupyter.widget-view+json": {
189
- "model_id": "03d8267a06a5435c8de7726bb0492621",
190
- "version_major": 2,
191
- "version_minor": 0
192
- },
193
- "text/plain": [
194
- "Downloading extra modules: 0%| | 0.00/3.44k [00:00<?, ?B/s]"
195
- ]
196
- },
197
- "metadata": {},
198
- "output_type": "display_data"
199
- },
200
- {
201
- "data": {
202
- "application/vnd.jupyter.widget-view+json": {
203
- "model_id": "67700bc114c74e05b2e8c0fa31ef479c",
204
- "version_major": 2,
205
- "version_minor": 0
206
- },
207
- "text/plain": [
208
- "Downloading extra modules: 0%| | 0.00/60.9k [00:00<?, ?B/s]"
209
- ]
210
- },
211
- "metadata": {},
212
- "output_type": "display_data"
213
- }
214
- ],
215
  "source": [
216
  "from datasets import IterableDatasetDict\n",
217
  "\n",
218
  "raw_datasets = IterableDatasetDict()\n",
219
  "\n",
220
- "raw_datasets[\"train\"] = load_streaming_dataset(\"mozilla-foundation/common_voice_11_0\", \"lt\", split=\"train+validation\", use_auth_token=True) # set split=\"train+validation\" for low-resource\n",
221
- "raw_datasets[\"test\"] = load_streaming_dataset(\"mozilla-foundation/common_voice_11_0\", \"lt\", split=\"test\", use_auth_token=True)"
222
  ]
223
  },
224
  {
@@ -254,110 +197,11 @@
254
  "execution_count": 3,
255
  "id": "77d9f0c5-8607-4642-a8ac-c3ab2e223ea6",
256
  "metadata": {},
257
- "outputs": [
258
- {
259
- "data": {
260
- "application/vnd.jupyter.widget-view+json": {
261
- "model_id": "75b767165e6e43db816df3911cfa841d",
262
- "version_major": 2,
263
- "version_minor": 0
264
- },
265
- "text/plain": [
266
- "Downloading: 0%| | 0.00/185k [00:00<?, ?B/s]"
267
- ]
268
- },
269
- "metadata": {},
270
- "output_type": "display_data"
271
- },
272
- {
273
- "data": {
274
- "application/vnd.jupyter.widget-view+json": {
275
- "model_id": "147d3f2f6bcf46b694088b963c0b8bbb",
276
- "version_major": 2,
277
- "version_minor": 0
278
- },
279
- "text/plain": [
280
- "Downloading: 0%| | 0.00/829 [00:00<?, ?B/s]"
281
- ]
282
- },
283
- "metadata": {},
284
- "output_type": "display_data"
285
- },
286
- {
287
- "data": {
288
- "application/vnd.jupyter.widget-view+json": {
289
- "model_id": "0a2ef4e849214883809f2717e04e8efd",
290
- "version_major": 2,
291
- "version_minor": 0
292
- },
293
- "text/plain": [
294
- "Downloading: 0%| | 0.00/1.04M [00:00<?, ?B/s]"
295
- ]
296
- },
297
- "metadata": {},
298
- "output_type": "display_data"
299
- },
300
- {
301
- "data": {
302
- "application/vnd.jupyter.widget-view+json": {
303
- "model_id": "157bdd4e09944f2fb4a564b5498ac986",
304
- "version_major": 2,
305
- "version_minor": 0
306
- },
307
- "text/plain": [
308
- "Downloading: 0%| | 0.00/494k [00:00<?, ?B/s]"
309
- ]
310
- },
311
- "metadata": {},
312
- "output_type": "display_data"
313
- },
314
- {
315
- "data": {
316
- "application/vnd.jupyter.widget-view+json": {
317
- "model_id": "37577267369d486aaf821fb9b616e54a",
318
- "version_major": 2,
319
- "version_minor": 0
320
- },
321
- "text/plain": [
322
- "Downloading: 0%| | 0.00/52.7k [00:00<?, ?B/s]"
323
- ]
324
- },
325
- "metadata": {},
326
- "output_type": "display_data"
327
- },
328
- {
329
- "data": {
330
- "application/vnd.jupyter.widget-view+json": {
331
- "model_id": "abc2d68feaff450c92d0b2223841d551",
332
- "version_major": 2,
333
- "version_minor": 0
334
- },
335
- "text/plain": [
336
- "Downloading: 0%| | 0.00/2.11k [00:00<?, ?B/s]"
337
- ]
338
- },
339
- "metadata": {},
340
- "output_type": "display_data"
341
- },
342
- {
343
- "data": {
344
- "application/vnd.jupyter.widget-view+json": {
345
- "model_id": "7483217a05e944309128f439da2e0a11",
346
- "version_major": 2,
347
- "version_minor": 0
348
- },
349
- "text/plain": [
350
- "Downloading: 0%| | 0.00/2.06k [00:00<?, ?B/s]"
351
- ]
352
- },
353
- "metadata": {},
354
- "output_type": "display_data"
355
- }
356
- ],
357
  "source": [
358
  "from transformers import WhisperProcessor\n",
359
  "\n",
360
- "processor = WhisperProcessor.from_pretrained(\"openai/whisper-small\", language=\"Lithuanian\", task=\"transcribe\")"
361
  ]
362
  },
363
  {
@@ -715,22 +559,7 @@
715
  "execution_count": 14,
716
  "id": "b22b4011-f31f-4b57-b684-c52332f92890",
717
  "metadata": {},
718
- "outputs": [
719
- {
720
- "data": {
721
- "application/vnd.jupyter.widget-view+json": {
722
- "model_id": "98ab67e0e7c14bbebd4f8526e604c70b",
723
- "version_major": 2,
724
- "version_minor": 0
725
- },
726
- "text/plain": [
727
- "Downloading builder script: 0%| | 0.00/4.49k [00:00<?, ?B/s]"
728
- ]
729
- },
730
- "metadata": {},
731
- "output_type": "display_data"
732
- }
733
- ],
734
  "source": [
735
  "import evaluate\n",
736
  "\n",
@@ -809,40 +638,11 @@
809
  "execution_count": 16,
810
  "id": "5a10cc4b-07ec-4ebd-ac1d-7c601023594f",
811
  "metadata": {},
812
- "outputs": [
813
- {
814
- "data": {
815
- "application/vnd.jupyter.widget-view+json": {
816
- "model_id": "e72a167577c24decbca6625ad8586d16",
817
- "version_major": 2,
818
- "version_minor": 0
819
- },
820
- "text/plain": [
821
- "Downloading: 0%| | 0.00/1.97k [00:00<?, ?B/s]"
822
- ]
823
- },
824
- "metadata": {},
825
- "output_type": "display_data"
826
- },
827
- {
828
- "data": {
829
- "application/vnd.jupyter.widget-view+json": {
830
- "model_id": "b801991734784e80a45e0fa326e29760",
831
- "version_major": 2,
832
- "version_minor": 0
833
- },
834
- "text/plain": [
835
- "Downloading: 0%| | 0.00/967M [00:00<?, ?B/s]"
836
- ]
837
- },
838
- "metadata": {},
839
- "output_type": "display_data"
840
- }
841
- ],
842
  "source": [
843
  "from transformers import WhisperForConditionalGeneration\n",
844
  "\n",
845
- "model = WhisperForConditionalGeneration.from_pretrained(\"openai/whisper-small\")"
846
  ]
847
  },
848
  {
@@ -1065,8 +865,8 @@
1065
  " Gradient Accumulation steps = 1\n",
1066
  " Total optimization steps = 2000\n",
1067
  " Number of trainable parameters = 241734912\n",
1068
- "Reading metadata...: 5194it [00:00, 22097.32it/s]\n",
1069
- "Reading metadata...: 3690it [00:00, 17242.11it/s]\n",
1070
  "The following columns in the training set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
1071
  ]
1072
  },
@@ -1076,8 +876,8 @@
1076
  "\n",
1077
  " <div>\n",
1078
  " \n",
1079
- " <progress value='2001' max='2000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
1080
- " [2000/2000 4:01:33, Epoch 17.01/9223372036854775807]\n",
1081
  " </div>\n",
1082
  " <table border=\"1\" class=\"dataframe\">\n",
1083
  " <thead>\n",
@@ -1085,16 +885,9 @@
1085
  " <th>Step</th>\n",
1086
  " <th>Training Loss</th>\n",
1087
  " <th>Validation Loss</th>\n",
1088
- " <th>Wer</th>\n",
1089
  " </tr>\n",
1090
  " </thead>\n",
1091
  " <tbody>\n",
1092
- " <tr>\n",
1093
- " <td>1000</td>\n",
1094
- " <td>0.009000</td>\n",
1095
- " <td>0.444009</td>\n",
1096
- " <td>34.279589</td>\n",
1097
- " </tr>\n",
1098
  " </tbody>\n",
1099
  "</table><p>"
1100
  ],
@@ -1109,60 +902,108 @@
1109
  "name": "stderr",
1110
  "output_type": "stream",
1111
  "text": [
1112
- "Reading metadata...: 5194it [00:00, 28115.87it/s]\n",
1113
- "Reading metadata...: 3690it [00:00, 17354.63it/s]\n",
1114
- "Reading metadata...: 5194it [00:00, 22384.93it/s]\n",
1115
- "Reading metadata...: 3690it [00:00, 19621.82it/s]\n",
1116
- "Reading metadata...: 5194it [00:00, 24467.85it/s]\n",
1117
- "Reading metadata...: 3690it [00:00, 25515.20it/s]\n",
1118
- "Reading metadata...: 5194it [00:00, 88011.11it/s]\n",
1119
- "Reading metadata...: 3690it [00:00, 77341.60it/s]\n",
1120
- "Reading metadata...: 5194it [00:00, 77903.11it/s]\n",
1121
- "Reading metadata...: 3690it [00:00, 70552.60it/s]\n",
1122
- "Reading metadata...: 5194it [00:00, 20135.03it/s]\n",
1123
- "Reading metadata...: 3690it [00:00, 16102.97it/s]\n",
1124
- "Reading metadata...: 5194it [00:00, 27943.77it/s]\n",
1125
- "Reading metadata...: 3690it [00:00, 13274.18it/s]\n",
1126
- "Reading metadata...: 5194it [00:00, 57949.57it/s]\n",
1127
- "Reading metadata...: 3690it [00:00, 72940.98it/s]\n",
1128
- "***** Running Evaluation *****\n",
1129
- " Num examples: Unknown\n",
1130
- " Batch size = 8\n",
1131
- "Reading metadata...: 3749it [00:00, 17477.47it/s]\n",
1132
- "The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n",
1133
- "Saving model checkpoint to ./checkpoint-1000\n",
1134
- "Configuration saved in ./checkpoint-1000/config.json\n",
1135
- "Model weights saved in ./checkpoint-1000/pytorch_model.bin\n",
1136
- "Feature extractor saved in ./checkpoint-1000/preprocessor_config.json\n",
1137
- "tokenizer config file saved in ./checkpoint-1000/tokenizer_config.json\n",
1138
- "Special tokens file saved in ./checkpoint-1000/special_tokens_map.json\n",
1139
- "added tokens file saved in ./checkpoint-1000/added_tokens.json\n",
1140
- "Feature extractor saved in ./preprocessor_config.json\n",
1141
- "tokenizer config file saved in ./tokenizer_config.json\n",
1142
- "Special tokens file saved in ./special_tokens_map.json\n",
1143
- "added tokens file saved in ./added_tokens.json\n",
1144
- "Reading metadata...: 5194it [00:00, 85044.01it/s]\n",
1145
- "Reading metadata...: 3690it [00:00, 74377.46it/s]\n",
1146
- "Reading metadata...: 5194it [00:00, 80124.52it/s]\n",
1147
- "Reading metadata...: 3690it [00:00, 67032.13it/s]\n",
1148
- "Reading metadata...: 5194it [00:00, 71957.77it/s]\n",
1149
- "Reading metadata...: 3690it [00:00, 57010.29it/s]\n",
1150
- "Reading metadata...: 5194it [00:00, 15179.43it/s]\n",
1151
- "Reading metadata...: 3690it [00:00, 11107.82it/s]\n",
1152
- "Reading metadata...: 5194it [00:00, 85555.35it/s]\n",
1153
- "Reading metadata...: 3690it [00:00, 68384.18it/s]\n",
1154
- "Reading metadata...: 5194it [00:00, 18672.38it/s]\n",
1155
- "Reading metadata...: 3690it [00:00, 28625.03it/s]\n",
1156
- "Reading metadata...: 5194it [00:00, 84027.47it/s]\n",
1157
- "Reading metadata...: 3690it [00:00, 62199.27it/s]\n",
1158
- "Reading metadata...: 5194it [00:00, 58151.75it/s]\n",
1159
- "Reading metadata...: 3690it [00:00, 59150.79it/s]\n",
1160
- "Reading metadata...: 5194it [00:00, 83226.87it/s]\n",
1161
- "Reading metadata...: 3690it [00:00, 70468.75it/s]\n",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1162
  "***** Running Evaluation *****\n",
1163
  " Num examples: Unknown\n",
1164
  " Batch size = 8\n",
1165
- "Reading metadata...: 3749it [00:00, 23184.29it/s]\n",
1166
  "The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
1167
  ]
1168
  }
@@ -1201,8 +1042,7 @@
1201
  "kwargs = {\n",
1202
  " \"dataset_tags\": \"mozilla-foundation/common_voice_11_0\",\n",
1203
  " \"dataset\": \"Common Voice 11.0\", # a 'pretty' name for the training dataset\n",
1204
- " \"language\": \"lt\",\n",
1205
- " \"model_name\": \"Whisper Small Lt and Sr\", # a 'pretty' name for your model\n",
1206
  " \"finetuned_from\": \"openai/whisper-small\",\n",
1207
  " \"tasks\": \"automatic-speech-recognition\",\n",
1208
  " \"tags\": \"whisper-event\",\n",
 
154
  "execution_count": 2,
155
  "id": "a2787582-554f-44ce-9f38-4180a5ed6b44",
156
  "metadata": {},
157
+ "outputs": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
158
  "source": [
159
  "from datasets import IterableDatasetDict\n",
160
  "\n",
161
  "raw_datasets = IterableDatasetDict()\n",
162
  "\n",
163
+ "raw_datasets[\"train\"] = load_streaming_dataset(\"mozilla-foundation/common_voice_11_0\", \"sr\", split=\"train+validation\", use_auth_token=True) # set split=\"train+validation\" for low-resource\n",
164
+ "raw_datasets[\"test\"] = load_streaming_dataset(\"mozilla-foundation/common_voice_11_0\", \"sr\", split=\"test\", use_auth_token=True)"
165
  ]
166
  },
167
  {
 
197
  "execution_count": 3,
198
  "id": "77d9f0c5-8607-4642-a8ac-c3ab2e223ea6",
199
  "metadata": {},
200
+ "outputs": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
201
  "source": [
202
  "from transformers import WhisperProcessor\n",
203
  "\n",
204
+ "processor = WhisperProcessor.from_pretrained(\"openai/whisper-small\", language=\"Serbian\", task=\"transcribe\")"
205
  ]
206
  },
207
  {
 
559
  "execution_count": 14,
560
  "id": "b22b4011-f31f-4b57-b684-c52332f92890",
561
  "metadata": {},
562
+ "outputs": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
563
  "source": [
564
  "import evaluate\n",
565
  "\n",
 
638
  "execution_count": 16,
639
  "id": "5a10cc4b-07ec-4ebd-ac1d-7c601023594f",
640
  "metadata": {},
641
+ "outputs": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
642
  "source": [
643
  "from transformers import WhisperForConditionalGeneration\n",
644
  "\n",
645
+ "model = WhisperForConditionalGeneration.from_pretrained(\"checkpoint-2000\")"
646
  ]
647
  },
648
  {
 
865
  " Gradient Accumulation steps = 1\n",
866
  " Total optimization steps = 2000\n",
867
  " Number of trainable parameters = 241734912\n",
868
+ "Reading metadata...: 1045it [00:00, 5692.34it/s]\n",
869
+ "Reading metadata...: 623it [00:00, 4270.71it/s]\n",
870
  "The following columns in the training set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
871
  ]
872
  },
 
876
  "\n",
877
  " <div>\n",
878
  " \n",
879
+ " <progress value='1001' max='2000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
880
+ " [1001/2000 1:45:14 < 1:45:14, 0.16 it/s, Epoch 49.01/9223372036854775807]\n",
881
  " </div>\n",
882
  " <table border=\"1\" class=\"dataframe\">\n",
883
  " <thead>\n",
 
885
  " <th>Step</th>\n",
886
  " <th>Training Loss</th>\n",
887
  " <th>Validation Loss</th>\n",
 
888
  " </tr>\n",
889
  " </thead>\n",
890
  " <tbody>\n",
 
 
 
 
 
 
891
  " </tbody>\n",
892
  "</table><p>"
893
  ],
 
902
  "name": "stderr",
903
  "output_type": "stream",
904
  "text": [
905
+ "Reading metadata...: 1045it [00:00, 5867.31it/s]\n",
906
+ "Reading metadata...: 623it [00:00, 4899.32it/s]\n",
907
+ "Reading metadata...: 1045it [00:00, 10001.87it/s]\n",
908
+ "Reading metadata...: 623it [00:00, 4402.30it/s]\n",
909
+ "Reading metadata...: 1045it [00:00, 10266.26it/s]\n",
910
+ "Reading metadata...: 623it [00:00, 3253.67it/s]\n",
911
+ "Reading metadata...: 1045it [00:00, 13354.24it/s]\n",
912
+ "Reading metadata...: 623it [00:00, 7292.22it/s]\n",
913
+ "Reading metadata...: 1045it [00:00, 33723.01it/s]\n",
914
+ "Reading metadata...: 623it [00:00, 28938.73it/s]\n",
915
+ "Reading metadata...: 1045it [00:00, 12782.78it/s]\n",
916
+ "Reading metadata...: 623it [00:00, 6901.10it/s]\n",
917
+ "Reading metadata...: 1045it [00:00, 34292.66it/s]\n",
918
+ "Reading metadata...: 623it [00:00, 33494.65it/s]\n",
919
+ "Reading metadata...: 1045it [00:00, 39667.03it/s]\n",
920
+ "Reading metadata...: 623it [00:00, 28214.13it/s]\n",
921
+ "Reading metadata...: 1045it [00:00, 42047.25it/s]\n",
922
+ "Reading metadata...: 623it [00:00, 32434.88it/s]\n",
923
+ "Reading metadata...: 1045it [00:00, 41330.01it/s]\n",
924
+ "Reading metadata...: 623it [00:00, 32047.04it/s]\n",
925
+ "Reading metadata...: 1045it [00:00, 29199.29it/s]\n",
926
+ "Reading metadata...: 623it [00:00, 30785.24it/s]\n",
927
+ "Reading metadata...: 1045it [00:00, 42721.43it/s]\n",
928
+ "Reading metadata...: 623it [00:00, 19130.06it/s]\n",
929
+ "Reading metadata...: 1045it [00:01, 738.01it/s]\n",
930
+ "Reading metadata...: 623it [00:01, 541.43it/s]\n",
931
+ "Reading metadata...: 1045it [00:00, 44482.59it/s]\n",
932
+ "Reading metadata...: 623it [00:00, 32484.48it/s]\n",
933
+ "Reading metadata...: 1045it [00:00, 41314.82it/s]\n",
934
+ "Reading metadata...: 623it [00:00, 28735.69it/s]\n",
935
+ "Reading metadata...: 1045it [00:00, 44215.15it/s]\n",
936
+ "Reading metadata...: 623it [00:00, 31580.71it/s]\n",
937
+ "Reading metadata...: 1045it [00:00, 1623.63it/s]\n",
938
+ "Reading metadata...: 623it [00:00, 1009.77it/s]\n",
939
+ "Reading metadata...: 1045it [00:00, 44171.93it/s]\n",
940
+ "Reading metadata...: 623it [00:00, 30811.38it/s]\n",
941
+ "Reading metadata...: 1045it [00:00, 43079.18it/s]\n",
942
+ "Reading metadata...: 623it [00:00, 15485.94it/s]\n",
943
+ "Reading metadata...: 1045it [00:00, 40702.87it/s]\n",
944
+ "Reading metadata...: 623it [00:00, 28661.31it/s]\n",
945
+ "Reading metadata...: 1045it [00:00, 44402.38it/s]\n",
946
+ "Reading metadata...: 623it [00:00, 31105.90it/s]\n",
947
+ "Reading metadata...: 1045it [00:00, 24505.06it/s]\n",
948
+ "Reading metadata...: 623it [00:00, 19740.06it/s]\n",
949
+ "Reading metadata...: 1045it [00:00, 4819.73it/s]\n",
950
+ "Reading metadata...: 623it [00:00, 4116.76it/s]\n",
951
+ "Reading metadata...: 1045it [00:00, 42929.81it/s]\n",
952
+ "Reading metadata...: 623it [00:00, 30741.78it/s]\n",
953
+ "Reading metadata...: 1045it [00:00, 9124.52it/s]\n",
954
+ "Reading metadata...: 623it [00:00, 4622.41it/s]\n",
955
+ "Reading metadata...: 1045it [00:00, 40983.75it/s]\n",
956
+ "Reading metadata...: 623it [00:00, 28923.67it/s]\n",
957
+ "Reading metadata...: 1045it [00:00, 9164.05it/s]\n",
958
+ "Reading metadata...: 623it [00:00, 5771.93it/s]\n",
959
+ "Reading metadata...: 1045it [00:00, 6674.98it/s]\n",
960
+ "Reading metadata...: 623it [00:00, 3780.80it/s]\n",
961
+ "Reading metadata...: 1045it [00:00, 43593.76it/s]\n",
962
+ "Reading metadata...: 623it [00:00, 21590.29it/s]\n",
963
+ "Reading metadata...: 1045it [00:00, 41968.74it/s]\n",
964
+ "Reading metadata...: 623it [00:00, 32694.20it/s]\n",
965
+ "Reading metadata...: 1045it [00:00, 17046.83it/s]\n",
966
+ "Reading metadata...: 623it [00:00, 11208.51it/s]\n",
967
+ "Reading metadata...: 1045it [00:00, 37953.07it/s]\n",
968
+ "Reading metadata...: 623it [00:00, 31590.64it/s]\n",
969
+ "Reading metadata...: 1045it [00:00, 39963.96it/s]\n",
970
+ "Reading metadata...: 623it [00:00, 30293.44it/s]\n",
971
+ "Reading metadata...: 1045it [00:00, 45293.92it/s]\n",
972
+ "Reading metadata...: 623it [00:00, 28211.39it/s]\n",
973
+ "Reading metadata...: 1045it [00:00, 3469.64it/s]\n",
974
+ "Reading metadata...: 623it [00:00, 6854.28it/s]\n",
975
+ "Reading metadata...: 1045it [00:00, 43085.10it/s]\n",
976
+ "Reading metadata...: 623it [00:00, 33438.50it/s]\n",
977
+ "Reading metadata...: 1045it [00:00, 32567.86it/s]\n",
978
+ "Reading metadata...: 623it [00:00, 27699.11it/s]\n",
979
+ "Reading metadata...: 1045it [00:00, 42481.27it/s]\n",
980
+ "Reading metadata...: 623it [00:00, 31889.43it/s]\n",
981
+ "Reading metadata...: 1045it [00:00, 16001.43it/s]\n",
982
+ "Reading metadata...: 623it [00:00, 13026.76it/s]\n",
983
+ "Reading metadata...: 1045it [00:00, 45249.50it/s]\n",
984
+ "Reading metadata...: 623it [00:00, 27699.70it/s]\n",
985
+ "Reading metadata...: 1045it [00:00, 41886.92it/s]\n",
986
+ "Reading metadata...: 623it [00:00, 30486.41it/s]\n",
987
+ "Reading metadata...: 1045it [00:00, 39246.49it/s]\n",
988
+ "Reading metadata...: 623it [00:00, 29180.46it/s]\n",
989
+ "Reading metadata...: 1045it [00:00, 40768.74it/s]\n",
990
+ "Reading metadata...: 623it [00:00, 25073.18it/s]\n",
991
+ "Reading metadata...: 1045it [00:00, 41413.97it/s]\n",
992
+ "Reading metadata...: 623it [00:00, 34066.69it/s]\n",
993
+ "Reading metadata...: 1045it [00:00, 43446.41it/s]\n",
994
+ "Reading metadata...: 623it [00:00, 14088.58it/s]\n",
995
+ "Reading metadata...: 1045it [00:00, 42264.17it/s]\n",
996
+ "Reading metadata...: 623it [00:00, 33832.48it/s]\n",
997
+ "Reading metadata...: 1045it [00:00, 35855.79it/s]\n",
998
+ "Reading metadata...: 623it [00:00, 14966.70it/s]\n",
999
+ "Reading metadata...: 1045it [00:00, 37491.43it/s]\n",
1000
+ "Reading metadata...: 623it [00:00, 25462.13it/s]\n",
1001
+ "Reading metadata...: 1045it [00:00, 18279.76it/s]\n",
1002
+ "Reading metadata...: 623it [00:00, 9944.59it/s]\n",
1003
  "***** Running Evaluation *****\n",
1004
  " Num examples: Unknown\n",
1005
  " Batch size = 8\n",
1006
+ "Reading metadata...: 677it [00:00, 4738.28it/s]\n",
1007
  "The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
1008
  ]
1009
  }
 
1042
  "kwargs = {\n",
1043
  " \"dataset_tags\": \"mozilla-foundation/common_voice_11_0\",\n",
1044
  " \"dataset\": \"Common Voice 11.0\", # a 'pretty' name for the training dataset\n",
1045
+ " \"model_name\": \"Whisper Small Lithuanian and Serbian sequentially trained\", # a 'pretty' name for your model\n",
 
1046
  " \"finetuned_from\": \"openai/whisper-small\",\n",
1047
  " \"tasks\": \"automatic-speech-recognition\",\n",
1048
  " \"tags\": \"whisper-event\",\n",
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a11f74090959c07ae26487bc3ce05849151ba32d0f718c8ab6924c218bbc666
3
  size 967102601
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c102a56223c9d4c0073bf307faa42881b324cda17921f66be674baeaac81536
3
  size 967102601
runs/Dec15_09-48-30_129-213-18-196/events.out.tfevents.1671097754.129-213-18-196.69807.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c18ec6a9ca2b818981f832541fefb0d38fab7f8805614f1308ce1609f3f6941
3
- size 17468
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:111a1faf82a941b0dd777617baa73f1608b1d0d430dce19d00ba139736484de6
3
+ size 17822
runs/Dec15_14-18-11_129-213-18-196/1671113929.6254616/events.out.tfevents.1671113929.129-213-18-196.4128231.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e59c4de1c5f36a53463a3c2eb9bdca8cf8c8cce7e955aab755b08013d5a8b019
3
+ size 5864
runs/Dec15_14-18-11_129-213-18-196/events.out.tfevents.1671113929.129-213-18-196.4128231.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79e3c278a91be84dc37fe3af83dfcdc461de029979a79195988c9f7a1dbaf16e
3
+ size 10865
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12802b2bf7011dc5b5a4acdb33b6f00f752ead32935befd31c68ab349d5b2f84
3
  size 3579
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3f2bc41361967c98d61c9072b7d10b71ba361fe800039babbb310b5e56c86cb
3
  size 3579