Maximofn committed on
Commit
4d57eee
1 Parent(s): bc986ed

Create script to transcribe audio files

Browse files
Files changed (1) hide show
  1. transcribe.py +26 -0
transcribe.py ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import argparse
3
+
4
def main(args):
    """Transcribe one audio file by invoking the ``whisper`` command-line tool.

    The command is executed without a shell and with one list element per
    argument, so an input path containing spaces or shell metacharacters is
    handed to ``whisper`` verbatim instead of being split or interpreted.
    As a consequence, glob patterns in ``args.input`` are not expanded.

    Args:
        args: Parsed command-line arguments. ``args.input`` is the audio file
            to transcribe and ``args.language`` is passed through as the
            value of the ``--language`` option.

    Returns:
        The exit status of the ``whisper`` process, or 127 when the
        ``whisper`` executable cannot be found.
    """
    # Imported locally so the function brings its own dependencies into scope.
    import subprocess
    import sys

    audio_file = args.input
    language = args.language
    output_folder = "transcriptions"

    # Transcribe audio file
    model = "large-v2"
    word_timestamps = True
    fp16 = False
    device = "cuda"
    verbose = False
    threads = 4
    command = [
        "whisper",
        "--model", model,
        "--output_dir", output_folder,
        "--language", str(language),
        # Booleans are rendered as "True"/"False", exactly as the original
        # f-string interpolation produced them.
        "--word_timestamps", str(word_timestamps),
        "--fp16", str(fp16),
        "--device", device,
        "--verbose", str(verbose),
        "--threads", str(threads),
        str(audio_file),
    ]

    try:
        completed = subprocess.run(command, check=False)
    except FileNotFoundError:
        # Without a shell, a missing executable raises instead of printing
        # "command not found"; keep the non-crashing behaviour and report it.
        print("whisper executable not found on PATH", file=sys.stderr)
        return 127
    return completed.returncode
20
+
21
if __name__ == "__main__":
    # Command-line entry point: register the two required positional
    # arguments in order, then hand the parsed namespace to main().
    cli = argparse.ArgumentParser(description="Transcribe audio files")
    for arg_name, arg_help in (
        ("input", "Input audio file"),
        ("language", "Language of the audio file"),
    ):
        cli.add_argument(arg_name, help=arg_help)
    main(cli.parse_args())