Training in progress, step 1000
Browse files
- pytorch_model.bin +1 -1
- run.sh +4 -4
- run_speech_recognition_seq2seq_streaming.py +8 -4
- runs/Dec12_16-17-24_spartan-gpgpu115.hpc.unimelb.edu.au/1670822323.3846912/events.out.tfevents.1670822323.spartan-gpgpu115.hpc.unimelb.edu.au.248583.1 +3 -0
- runs/Dec12_16-17-24_spartan-gpgpu115.hpc.unimelb.edu.au/events.out.tfevents.1670822323.spartan-gpgpu115.hpc.unimelb.edu.au.248583.0 +3 -0
- runs/Dec12_18-44-54_spartan-gpgpu115.hpc.unimelb.edu.au/1670831139.1402473/events.out.tfevents.1670831139.spartan-gpgpu115.hpc.unimelb.edu.au.146080.1 +3 -0
- runs/Dec12_18-44-54_spartan-gpgpu115.hpc.unimelb.edu.au/events.out.tfevents.1670831139.spartan-gpgpu115.hpc.unimelb.edu.au.146080.0 +3 -0
- training_args.bin +1 -1
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6173655480
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7102a6b0b37c636335ba700287e7fcad791b55cc59af204105d8d3dfb248cf52
|
3 |
size 6173655480
|
run.sh
CHANGED
@@ -6,17 +6,17 @@ python run_speech_recognition_seq2seq_streaming.py \
|
|
6 |
--train_split_name="train+validation" \
|
7 |
--eval_split_name="test" \
|
8 |
--model_index_name="Whisper Large Vietnamese" \
|
9 |
-
--max_steps="
|
10 |
--output_dir="./" \
|
11 |
--per_device_train_batch_size="32" \
|
12 |
--per_device_eval_batch_size="16" \
|
13 |
--logging_steps="25" \
|
14 |
-
--learning_rate="1e-
|
15 |
--warmup_steps="100" \
|
16 |
--evaluation_strategy="steps" \
|
17 |
-
--eval_steps="
|
18 |
--save_strategy="steps" \
|
19 |
-
--save_steps="
|
20 |
--generation_max_length="225" \
|
21 |
--length_column_name="input_length" \
|
22 |
--max_duration_in_seconds="30" \
|
|
|
6 |
--train_split_name="train+validation" \
|
7 |
--eval_split_name="test" \
|
8 |
--model_index_name="Whisper Large Vietnamese" \
|
9 |
+
--max_steps="5000" \
|
10 |
--output_dir="./" \
|
11 |
--per_device_train_batch_size="32" \
|
12 |
--per_device_eval_batch_size="16" \
|
13 |
--logging_steps="25" \
|
14 |
+
--learning_rate="1e-6" \
|
15 |
--warmup_steps="100" \
|
16 |
--evaluation_strategy="steps" \
|
17 |
+
--eval_steps="1000" \
|
18 |
--save_strategy="steps" \
|
19 |
+
--save_steps="1000" \
|
20 |
--generation_max_length="225" \
|
21 |
--length_column_name="input_length" \
|
22 |
--max_duration_in_seconds="30" \
|
run_speech_recognition_seq2seq_streaming.py
CHANGED
@@ -501,10 +501,11 @@ def main():
|
|
501 |
def is_audio_in_length_range(length):
|
502 |
return min_input_length < length < max_input_length
|
503 |
|
504 |
-
|
505 |
-
|
506 |
-
|
507 |
-
|
|
|
508 |
|
509 |
# 8. Load Metric
|
510 |
metric = evaluate.load("wer")
|
@@ -522,6 +523,9 @@ def main():
|
|
522 |
if do_normalize_eval:
|
523 |
pred_str = [normalizer(pred) for pred in pred_str]
|
524 |
label_str = [normalizer(label) for label in label_str]
|
|
|
|
|
|
|
525 |
|
526 |
wer = 100 * metric.compute(predictions=pred_str, references=label_str)
|
527 |
|
|
|
501 |
def is_audio_in_length_range(length):
|
502 |
return min_input_length < length < max_input_length
|
503 |
|
504 |
+
if training_args.do_train:
|
505 |
+
vectorized_datasets["train"] = vectorized_datasets["train"].filter(
|
506 |
+
is_audio_in_length_range,
|
507 |
+
input_columns=["input_length"],
|
508 |
+
)
|
509 |
|
510 |
# 8. Load Metric
|
511 |
metric = evaluate.load("wer")
|
|
|
523 |
if do_normalize_eval:
|
524 |
pred_str = [normalizer(pred) for pred in pred_str]
|
525 |
label_str = [normalizer(label) for label in label_str]
|
526 |
+
# filtering step to only evaluate the samples that correspond to non-zero references:
|
527 |
+
pred_str = [pred_str[i] for i in range(len(pred_str)) if len(label_str[i]) > 0]
|
528 |
+
label_str = [label_str[i] for i in range(len(label_str)) if len(label_str[i]) > 0]
|
529 |
|
530 |
wer = 100 * metric.compute(predictions=pred_str, references=label_str)
|
531 |
|
runs/Dec12_16-17-24_spartan-gpgpu115.hpc.unimelb.edu.au/1670822323.3846912/events.out.tfevents.1670822323.spartan-gpgpu115.hpc.unimelb.edu.au.248583.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ce0047001e53c6fe1d14167b5b5fb1fa5f87196f1e7de29cd173591852bc6cc
|
3 |
+
size 5730
|
runs/Dec12_16-17-24_spartan-gpgpu115.hpc.unimelb.edu.au/events.out.tfevents.1670822323.spartan-gpgpu115.hpc.unimelb.edu.au.248583.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9dea4a566557912ace98f6d6d7b35a7f9a5f72a52f0a425e7e32c22790d66d7f
|
3 |
+
size 4203
|
runs/Dec12_18-44-54_spartan-gpgpu115.hpc.unimelb.edu.au/1670831139.1402473/events.out.tfevents.1670831139.spartan-gpgpu115.hpc.unimelb.edu.au.146080.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7e19cba18916450c4882276ba80316dc46b320da86e129cb8c6e7cad1ac7d16
|
3 |
+
size 5730
|
runs/Dec12_18-44-54_spartan-gpgpu115.hpc.unimelb.edu.au/events.out.tfevents.1670831139.spartan-gpgpu115.hpc.unimelb.edu.au.146080.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a470c12c1f15c6ba258717c9b1462892974cc1419b9296ef55fd07467047b3e0
|
3 |
+
size 10786
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3515
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46a814996c8c7be78345a57772149f9ab0950a112cff44d30a75b7b82eb3b63e
|
3 |
size 3515
|