Spaces:

Maximofn
/

subtify

Sleeping

App Files Files Community

Maximofn committed on Oct 23, 2023

Commit

9ecf696

•

1 Parent(s): 7bfb36e

Script to concatenate chunk transcriptions into one file

Browse files

Files changed (1) hide show

concat_transcriptions.py +77 -0

concat_transcriptions.py ADDED Viewed

	@@ -0,0 +1,77 @@

+import argparse
+import re
def sum_seconds(time, seconds):
    """Return the SRT timestamp *time* shifted by a whole number of seconds.

    Args:
        time: Timestamp in ``hh:mm:ss,mmm`` form.
        seconds: Integer number of seconds to add.

    Returns:
        The shifted timestamp in ``hh:mm:ss,mmm`` form. The text after the
        comma is copied through untouched, since only whole seconds are added.
    """
    pieces = time.split(",")
    clock, fraction = pieces[0], pieces[1]

    # Collapse hh:mm:ss into a single count of seconds and apply the offset.
    fields = clock.split(":")
    total = int(fields[0]) * 3600 + int(fields[1]) * 60 + int(fields[2]) + seconds

    # Break the shifted total back into clock components.
    hh, remainder = divmod(total, 3600)
    mm, ss = divmod(remainder, 60)
    return f"{hh:02d}:{mm:02d}:{ss:02d},{fraction}"
def main(args):
    """Concatenate per-chunk SRT transcriptions into a single SRT file.

    The file at ``args.chunk_files`` lists one chunk path per line. For each
    listed chunk, the matching transcription
    ``transcriptions/<chunk stem>_speaker<NNN>.srt`` is read, its cue
    timestamps are shifted by the chunk's position times the chunk duration,
    and its cue counters are renumbered so they run continuously across
    chunks. The result is written to
    ``concatenated_transcriptions/<name>_speaker<NNN>.srt``, where ``<name>``
    is the last chunk's stem without its final ``_``-separated component.

    Args:
        args: Namespace providing ``chunk_files`` (path to the chunk list),
            ``seconds`` (duration of each chunk, convertible to ``int``) and
            ``speaker`` (speaker number, convertible to ``int``).

    Raises:
        ValueError: If the chunk list contains no paths.
    """
    chunk_files = args.chunk_files
    seconds = int(args.seconds)
    speaker = int(args.speaker)
    chunk_folder = "transcriptions"
    output_folder = "concatenated_transcriptions"
    transcription_extension = "srt"

    # Compiled once; both patterns are applied to every line of every chunk.
    timestamp_re = re.compile(r"\d\d:\d\d:\d\d,\d\d\d --> \d\d:\d\d:\d\d,\d\d\d")
    counter_re = re.compile(r"\d+$")

    # Read chunk files, ignoring blank lines in the list.
    with open(chunk_files, "r") as f:
        chunks = [entry.strip() for entry in f if entry.strip()]
    if not chunks:
        raise ValueError(f"No chunk paths found in {chunk_files!r}")

    # Concatenate transcriptions
    output_lines = []
    num_transcriptions = 1
    stem = ""
    for i, chunk in enumerate(chunks):
        # Every cue in chunk i starts i whole chunks into the original media.
        offset = i * seconds

        # Keep only the file name without directories or extension; rsplit
        # tolerates nested folders and dots inside the name.
        stem = chunk.rsplit("/", 1)[-1].rsplit(".", 1)[0]
        transcription_chunk_file = (
            f"{chunk_folder}/{stem}_speaker{speaker:03d}.{transcription_extension}"
        )
        with open(transcription_chunk_file, "r") as f:
            chunk_lines = f.read().splitlines()

        for pos, line in enumerate(chunk_lines):
            if timestamp_re.match(line):
                # Shift BOTH ends of the cue by the same chunk offset.
                start, end = line.split(" --> ", 1)
                start = sum_seconds(start, offset)
                end = sum_seconds(end, offset)
                output_lines.append(f"{start} --> {end}\n")
            elif (
                counter_re.match(line)
                and pos + 1 < len(chunk_lines)
                and timestamp_re.match(chunk_lines[pos + 1])
            ):
                # A cue counter is always directly followed by its timing
                # line; an all-digit line elsewhere is subtitle text and must
                # be kept as is.
                output_lines.append(f"{num_transcriptions}\n")
                num_transcriptions += 1
            else:
                output_lines.append(f"{line}\n")

    # Write transcription. The output name is the last chunk's stem with its
    # trailing "_<part>" component removed.
    base_name = "_".join(stem.split("_")[:-1])
    output_file = (
        f"{output_folder}/{base_name}_speaker{speaker:03d}.{transcription_extension}"
    )
    with open(output_file, "w") as f:
        f.writelines(output_lines)
if __name__ == "__main__":
    # Command-line entry point: parse the three positional arguments and run
    # the concatenation. The numeric arguments are validated by argparse so a
    # bad value produces a usage error instead of a traceback from main().
    parser = argparse.ArgumentParser(
        description="Concatenate chunk transcriptions into one SRT file"
    )
    parser.add_argument("chunk_files", help="Path to the file containing the paths to the chunk files")
    parser.add_argument("seconds", type=int, help="Duration of each chunk in seconds")
    parser.add_argument("speaker", type=int, help="Speaker number (zero-padded to three digits in file names)")
    args = parser.parse_args()
    main(args)