MultiMed

Runtime error

App Files Files Community

Tonic committed on Nov 19, 2023

Commit

16c1c4f

•

1 Parent(s): 342fcb6

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -12

app.py CHANGED Viewed

@@ -1,7 +1,6 @@
 # Welcome to Team Tonic's MultiMed
 from gradio_client import Client
-import os
 import numpy as np
 import base64
 import gradio as gr
@@ -10,10 +9,10 @@ import requests
 import json
 import dotenv
 from scipy.io.wavfile import write
-import PIL
 import soundfile as sf
 from openai import OpenAI
 import time
 from PIL import Image
 import io
 import hashlib
@@ -28,6 +27,8 @@ from transformers import AutoConfig, AutoTokenizer, AutoModelForSeq2SeqLM, AutoM
 from peft import PeftModel, PeftConfig
 import torch
 import os
 # Global variables to hold component references
 components = {}
@@ -120,9 +121,10 @@ def process_speech(input_language, audio_input):
     except Exception as e :
         return f"{e}"
 def convert_text_to_speech(input_text, target_language):
     """
-    Convert text to speech in the specified language and return the audio file path and the input text.
     """
     try:
         text_to_speech_result = seamless_client.predict(
@@ -136,17 +138,16 @@ def convert_text_to_speech(input_text, target_language):
             api_name="/run"  # API name
         )
-        # Assuming the audio file path is in the second position of the result
-        audio_file = text_to_speech_result[1]
-        max_length = 25
-        dir_name, file_name = os.path.split(audio_file)
-        file_extension = os.path.splitext(file_name)[1]
-        shortened_file_name = file_name[:max_length - len(file_extension)] + file_extension
-        shortened_audio_file = os.path.join(dir_name, shortened_file_name)
-        # Return the shortened audio file path and the input text
-        return shortened_audio_file, input_text
     except Exception as e:
         return f"An error occurred during text-to-speech conversion: {e}", input_text

 # Welcome to Team Tonic's MultiMed
 from gradio_client import Client
 import numpy as np
 import base64
 import gradio as gr
 import json
 import dotenv
 from scipy.io.wavfile import write
 import soundfile as sf
 from openai import OpenAI
 import time
+import PIL
 from PIL import Image
 import io
 import hashlib
 from peft import PeftModel, PeftConfig
 import torch
 import os
+import uuid
 # Global variables to hold component references
 components = {}
     except Exception as e :
         return f"{e}"
 def convert_text_to_speech(input_text, target_language):
     """
+    Convert text to speech in the specified language, rename the audio file with a unique identifier, and return both the new audio file path and the input text.
     """
     try:
         text_to_speech_result = seamless_client.predict(
             api_name="/run"  # API name
         )
+        original_audio_file = text_to_speech_result[1]  # Assuming the audio file path is in the second position
+        # Generate a new file name with a random UUID
+        new_file_name = f"audio_output_{uuid.uuid4()}.wav"
+        new_file_path = os.path.join(os.path.dirname(original_audio_file), new_file_name)
+        # Rename the file
+        os.rename(original_audio_file, new_file_path)
+        return new_file_path, input_text
     except Exception as e:
         return f"An error occurred during text-to-speech conversion: {e}", input_text