Maximofn committed on
Commit
119cb0d
1 Parent(s): 96bc450

Add progress bar to translate transcriptions script

Browse files
Files changed (1) hide show
  1. translate_transcriptions.py +3 -0
translate_transcriptions.py CHANGED
@@ -3,6 +3,7 @@ from transformers import MBartForConditionalGeneration, MBart50TokenizerFast
3
  from lang_list import LANGUAGE_NAME_TO_CODE, WHISPER_LANGUAGES
4
  import argparse
5
  import re
 
6
 
7
  language_dict = {}
8
  # Iterate over the LANGUAGE_NAME_TO_CODE dictionary
@@ -45,6 +46,7 @@ def main(transcription_file, source_languaje, target_languaje, translate_model,
45
 
46
  # Translate
47
  translate_transcription = ""
 
48
  for line in transcription:
49
  if re.match(r"\d+$", line):
50
  translate_transcription += f"{line}\n"
@@ -56,6 +58,7 @@ def main(transcription_file, source_languaje, target_languaje, translate_model,
56
  translated = translate(line, source_languaje, target_languaje, translate_model, translate_tokenizer, device)
57
  # translated = line
58
  translate_transcription += f"{translated}\n"
 
59
 
60
  # Save translation
61
  output_file = f"{output_folder}/{transcription_file_name}_{target_languaje}.srt"
 
3
  from lang_list import LANGUAGE_NAME_TO_CODE, WHISPER_LANGUAGES
4
  import argparse
5
  import re
6
+ from tqdm import tqdm
7
 
8
  language_dict = {}
9
  # Iterate over the LANGUAGE_NAME_TO_CODE dictionary
 
46
 
47
  # Translate
48
  translate_transcription = ""
49
+ progress_bar = tqdm(total=len(transcription), desc='Translating transcription progress')
50
  for line in transcription:
51
  if re.match(r"\d+$", line):
52
  translate_transcription += f"{line}\n"
 
58
  translated = translate(line, source_languaje, target_languaje, translate_model, translate_tokenizer, device)
59
  # translated = line
60
  translate_transcription += f"{translated}\n"
61
+ progress_bar.update(1)
62
 
63
  # Save translation
64
  output_file = f"{output_folder}/{transcription_file_name}_{target_languaje}.srt"