Jingmiao committed on
Commit
f383db3
1 Parent(s): 62e0d50

Training in progress, step 1000

Browse files
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a27130315b5147db7b9315597e9857ff6aea1ac62aa8f8a1e9b4b3f10ad5fa9
3
  size 967102601
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d209be948a097f78946d50db10de9282b601215dc1a3b48b1770e9ef2a71a643
3
  size 967102601
run.sh CHANGED
@@ -226,3 +226,155 @@ python run_speech_recognition_seq2seq_streaming.py \
226
  --streaming \
227
  --use_auth_token \
228
  --push_to_hub
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
226
  --streaming \
227
  --use_auth_token \
228
  --push_to_hub
229
+ python run_speech_recognition_seq2seq_streaming.py \
230
+ --model_name_or_path="openai/whisper-small" \
231
+ -- dataset_name = "google/fleurs"
232
+ --dataset_config_name="cmn_hans_cn" \
233
+ --language="chinese" \
234
+ --train_split_name="train+validation" \
235
+ --eval_split_name="test" \
236
+ --model_index_name="Whisper Small Chinese Mandarin Base Dataset" \
237
+ --max_steps="5000" \
238
+ --output_dir="./" \
239
+ --per_device_train_batch_size="64" \
240
+ --per_device_eval_batch_size="32" \
241
+ --logging_steps="25" \
242
+ --learning_rate="1e-5" \
243
+ --warmup_steps="500" \
244
+ --evaluation_strategy="steps" \
245
+ --eval_steps="1000" \
246
+ --save_strategy="steps" \
247
+ --save_steps="1000" \
248
+ --generation_max_length="225" \
249
+ --length_column_name="input_length" \
250
+ --max_duration_in_seconds="30" \
251
+ --text_column_name="sentence" \
252
+ --freeze_feature_encoder="False" \
253
+ --report_to="tensorboard" \
254
+ --metric_for_best_model="wer" \
255
+ --greater_is_better="False" \
256
+ --load_best_model_at_end \
257
+ --gradient_checkpointing \
258
+ --fp16 \
259
+ --overwrite_output_dir \
260
+ --do_train \
261
+ --do_eval \
262
+ --predict_with_generate \
263
+ --do_normalize_eval \
264
+ --streaming \
265
+ --use_auth_token \
266
+ --push_to_hub
267
+ python run_speech_recognition_seq2seq_streaming.py \
268
+ --model_name_or_path="openai/whisper-small" \
269
+ -- dataset_name = "google/fleurs"
270
+ --dataset_config_name="cmn_hans_cn" \
271
+ --language="chinese" \
272
+ --train_split_name="train+validation" \
273
+ --eval_split_name="test" \
274
+ --model_index_name="Whisper Small Chinese Mandarin Base Dataset" \
275
+ --max_steps="5000" \
276
+ --output_dir="./" \
277
+ --per_device_train_batch_size="64" \
278
+ --per_device_eval_batch_size="32" \
279
+ --logging_steps="25" \
280
+ --learning_rate="1e-5" \
281
+ --warmup_steps="500" \
282
+ --evaluation_strategy="steps" \
283
+ --eval_steps="1000" \
284
+ --save_strategy="steps" \
285
+ --save_steps="1000" \
286
+ --generation_max_length="225" \
287
+ --length_column_name="input_length" \
288
+ --max_duration_in_seconds="30" \
289
+ --text_column_name="sentence" \
290
+ --freeze_feature_encoder="False" \
291
+ --report_to="tensorboard" \
292
+ --metric_for_best_model="wer" \
293
+ --greater_is_better="False" \
294
+ --load_best_model_at_end \
295
+ --gradient_checkpointing \
296
+ --fp16 \
297
+ --overwrite_output_dir \
298
+ --do_train \
299
+ --do_eval \
300
+ --predict_with_generate \
301
+ --do_normalize_eval \
302
+ --streaming \
303
+ --use_auth_token \
304
+ --push_to_hub
305
+ python run_speech_recognition_seq2seq_streaming.py \
306
+ --model_name_or_path="Jingmiao/whisper-small-chinese_base" \
307
+ --dataset_name="mozilla-foundation/common_voice_11_" \
308
+ --dataset_config_name="zh-TW" \
309
+ --language="chinese" \
310
+ --train_split_name="train+validation" \
311
+ --eval_split_name="test" \
312
+ --model_index_name="Whisper Small TW on Chinese base" \
313
+ --max_steps="5000" \
314
+ --output_dir="./" \
315
+ --per_device_train_batch_size="64" \
316
+ --per_device_eval_batch_size="32" \
317
+ --logging_steps="25" \
318
+ --learning_rate="1e-5" \
319
+ --warmup_steps="500" \
320
+ --evaluation_strategy="steps" \
321
+ --eval_steps="1000" \
322
+ --save_strategy="steps" \
323
+ --save_steps="1000" \
324
+ --generation_max_length="225" \
325
+ --length_column_name="input_length" \
326
+ --max_duration_in_seconds="30" \
327
+ --text_column_name="sentence" \
328
+ --freeze_feature_encoder="False" \
329
+ --report_to="tensorboard" \
330
+ --metric_for_best_model="wer" \
331
+ --greater_is_better="False" \
332
+ --load_best_model_at_end \
333
+ --gradient_checkpointing \
334
+ --fp16 \
335
+ --overwrite_output_dir \
336
+ --do_train \
337
+ --do_eval \
338
+ --predict_with_generate \
339
+ --do_normalize_eval \
340
+ --streaming \
341
+ --use_auth_token \
342
+ --push_to_hub
343
+ python run_speech_recognition_seq2seq_streaming.py \
344
+ --model_name_or_path="Jingmiao/whisper-small-chinese_base" \
345
+ --dataset_name="mozilla-foundation/common_voice_11_0" \
346
+ --dataset_config_name="zh-TW" \
347
+ --language="chinese" \
348
+ --train_split_name="train+validation" \
349
+ --eval_split_name="test" \
350
+ --model_index_name="Whisper Small TW on Chinese base" \
351
+ --max_steps="5000" \
352
+ --output_dir="./" \
353
+ --per_device_train_batch_size="64" \
354
+ --per_device_eval_batch_size="32" \
355
+ --logging_steps="25" \
356
+ --learning_rate="1e-5" \
357
+ --warmup_steps="500" \
358
+ --evaluation_strategy="steps" \
359
+ --eval_steps="1000" \
360
+ --save_strategy="steps" \
361
+ --save_steps="1000" \
362
+ --generation_max_length="225" \
363
+ --length_column_name="input_length" \
364
+ --max_duration_in_seconds="30" \
365
+ --text_column_name="sentence" \
366
+ --freeze_feature_encoder="False" \
367
+ --report_to="tensorboard" \
368
+ --metric_for_best_model="wer" \
369
+ --greater_is_better="False" \
370
+ --load_best_model_at_end \
371
+ --gradient_checkpointing \
372
+ --fp16 \
373
+ --overwrite_output_dir \
374
+ --do_train \
375
+ --do_eval \
376
+ --predict_with_generate \
377
+ --do_normalize_eval \
378
+ --streaming \
379
+ --use_auth_token \
380
+ --push_to_hub
runs/Dec19_00-14-40_129-213-131-109/1671408888.219753/events.out.tfevents.1671408888.129-213-131-109.84528.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f433a234dc2508d82126b0731dd5cc8f1560762e9d440118665891c86387fc2
3
+ size 5871
runs/Dec19_00-14-40_129-213-131-109/events.out.tfevents.1671408888.129-213-131-109.84528.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a84617fdbd2048bc0117d1c482462c70606a74aee8007acdde8362e5cb73839
3
+ size 4268
runs/Dec19_00-15-22_129-213-131-109/1671408930.5727222/events.out.tfevents.1671408930.129-213-131-109.84922.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c14780a7b4c8a3b50424218afcb84663c3152dfd8d2dc249b2fb0948c3bd2ed6
3
+ size 5871
runs/Dec19_00-15-22_129-213-131-109/events.out.tfevents.1671408930.129-213-131-109.84922.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5377c4b8ee88d4102c4b38f75c1fdf984a6904b6283488ee12a1df4b948f51fe
3
+ size 10851
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04e3593c44117435b70a5e928d1be360435aa01916b3b5063b037e743189a76f
3
  size 3579
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66eea850f06cf43eb6ea191a013b50870ed87ef30fcfb5aad2c92fbf844595bd
3
  size 3579