joey234 committed on
Commit
66bd910
·
1 Parent(s): 6cfd8b0

Training in progress, step 1000

Browse files
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5447c8090dadc8995e3c0111e08b30c73a5a9c06c4b2511e4a5bcb050133486
3
  size 6173655480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7102a6b0b37c636335ba700287e7fcad791b55cc59af204105d8d3dfb248cf52
3
  size 6173655480
run.sh CHANGED
@@ -6,17 +6,17 @@ python run_speech_recognition_seq2seq_streaming.py \
6
  --train_split_name="train+validation" \
7
  --eval_split_name="test" \
8
  --model_index_name="Whisper Large Vietnamese" \
9
- --max_steps="1000" \
10
  --output_dir="./" \
11
  --per_device_train_batch_size="32" \
12
  --per_device_eval_batch_size="16" \
13
  --logging_steps="25" \
14
- --learning_rate="1e-5" \
15
  --warmup_steps="100" \
16
  --evaluation_strategy="steps" \
17
- --eval_steps="250" \
18
  --save_strategy="steps" \
19
- --save_steps="250" \
20
  --generation_max_length="225" \
21
  --length_column_name="input_length" \
22
  --max_duration_in_seconds="30" \
 
6
  --train_split_name="train+validation" \
7
  --eval_split_name="test" \
8
  --model_index_name="Whisper Large Vietnamese" \
9
+ --max_steps="5000" \
10
  --output_dir="./" \
11
  --per_device_train_batch_size="32" \
12
  --per_device_eval_batch_size="16" \
13
  --logging_steps="25" \
14
+ --learning_rate="1e-6" \
15
  --warmup_steps="100" \
16
  --evaluation_strategy="steps" \
17
+ --eval_steps="1000" \
18
  --save_strategy="steps" \
19
+ --save_steps="1000" \
20
  --generation_max_length="225" \
21
  --length_column_name="input_length" \
22
  --max_duration_in_seconds="30" \
run_speech_recognition_seq2seq_streaming.py CHANGED
@@ -501,10 +501,11 @@ def main():
501
  def is_audio_in_length_range(length):
502
  return min_input_length < length < max_input_length
503
 
504
- vectorized_datasets["train"] = vectorized_datasets["train"].filter(
505
- is_audio_in_length_range,
506
- input_columns=["input_length"],
507
- )
 
508
 
509
  # 8. Load Metric
510
  metric = evaluate.load("wer")
@@ -522,6 +523,9 @@ def main():
522
  if do_normalize_eval:
523
  pred_str = [normalizer(pred) for pred in pred_str]
524
  label_str = [normalizer(label) for label in label_str]
 
 
 
525
 
526
  wer = 100 * metric.compute(predictions=pred_str, references=label_str)
527
 
 
501
  def is_audio_in_length_range(length):
502
  return min_input_length < length < max_input_length
503
 
504
+ if training_args.do_train:
505
+ vectorized_datasets["train"] = vectorized_datasets["train"].filter(
506
+ is_audio_in_length_range,
507
+ input_columns=["input_length"],
508
+ )
509
 
510
  # 8. Load Metric
511
  metric = evaluate.load("wer")
 
523
  if do_normalize_eval:
524
  pred_str = [normalizer(pred) for pred in pred_str]
525
  label_str = [normalizer(label) for label in label_str]
526
+ # filtering step to only evaluate the samples that correspond to non-zero references:
527
+ pred_str = [pred_str[i] for i in range(len(pred_str)) if len(label_str[i]) > 0]
528
+ label_str = [label_str[i] for i in range(len(label_str)) if len(label_str[i]) > 0]
529
 
530
  wer = 100 * metric.compute(predictions=pred_str, references=label_str)
531
 
runs/Dec12_16-17-24_spartan-gpgpu115.hpc.unimelb.edu.au/1670822323.3846912/events.out.tfevents.1670822323.spartan-gpgpu115.hpc.unimelb.edu.au.248583.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ce0047001e53c6fe1d14167b5b5fb1fa5f87196f1e7de29cd173591852bc6cc
3
+ size 5730
runs/Dec12_16-17-24_spartan-gpgpu115.hpc.unimelb.edu.au/events.out.tfevents.1670822323.spartan-gpgpu115.hpc.unimelb.edu.au.248583.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dea4a566557912ace98f6d6d7b35a7f9a5f72a52f0a425e7e32c22790d66d7f
3
+ size 4203
runs/Dec12_18-44-54_spartan-gpgpu115.hpc.unimelb.edu.au/1670831139.1402473/events.out.tfevents.1670831139.spartan-gpgpu115.hpc.unimelb.edu.au.146080.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7e19cba18916450c4882276ba80316dc46b320da86e129cb8c6e7cad1ac7d16
3
+ size 5730
runs/Dec12_18-44-54_spartan-gpgpu115.hpc.unimelb.edu.au/events.out.tfevents.1670831139.spartan-gpgpu115.hpc.unimelb.edu.au.146080.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a470c12c1f15c6ba258717c9b1462892974cc1419b9296ef55fd07467047b3e0
3
+ size 10786
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a94b1449f30d120ad9017982c5fa06a4324241f23aab28f07da46bce5ae0d57d
3
  size 3515
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46a814996c8c7be78345a57772149f9ab0950a112cff44d30a75b7b82eb3b63e
3
  size 3515