Spaces:

yuangongfdu
/

ltu-2

Running

App Files Files Community

yuangongfdu committed on Aug 19, 2023

Commit

bfe831e

•

1 Parent(s): 7a2502d

Update app.py

Browse files

Files changed (1) hide show

app.py +18 -1

app.py CHANGED Viewed

@@ -1,9 +1,24 @@
 import json
 import gradio as gr
 import requests
 def upload_audio(audio_path):
     try:
         with open(audio_path, 'rb') as audio_file:
             response = requests.post('http://sls-titan-6.csail.mit.edu:8080/upload/', files={'audio_file': audio_file})
         if response.status_code == 200:
@@ -15,6 +30,8 @@ def predict(audio_path, question):
     upload_statues = upload_audio(audio_path)
     if upload_statues == None:
         return 'Please upload an audio file.'
     if question == '':
         return 'Please ask a question.'
     print(audio_path, question)
@@ -42,6 +59,6 @@ if __name__ == '__main__':
                         description="LTU-2 an improved version of LTU. LTU-2 is stronger in spoken text understanding and music understanding. <br>" +
                                     "LTU is authored by Yuan Gong, Alexander H. Liu, Hongyin Luo, Leonid Karlinsky, and James Glass (MIT & MIT-IBM Watson AI Lab). <br>" +
                                     "**Please note that the model is under construction and may be buggy. It is trained with some new techniques that are not described in LTU paper. I.e., using method described in LTU paper cannot reproduce this model.**<br>" +
-                                    "Input should be wav file sampled at 16kHz. This demo trim input audio to 10 seconds."
                                     "**Research Demo, No Commercial Use (Due to license of LLaMA).**")
     demo.launch(debug=False, share=False)

 import json
 import gradio as gr
 import requests
+import os
def is_file_larger_than_30mb(file_path):
    """Return True when the file at *file_path* is strictly larger than 30 MiB.

    This is a best-effort check: if the size cannot be determined, the
    function returns False instead of raising.

    Args:
        file_path: Path of the file to inspect. ``None`` or any other
            non-path value is tolerated and yields False.

    Returns:
        bool: True only if the size could be read and exceeds
        30 * 1024 * 1024 bytes; False otherwise.
    """
    limit_bytes = 30 * 1024 * 1024
    try:
        return os.path.getsize(file_path) > limit_bytes
    except (OSError, TypeError, ValueError):
        # OSError covers a missing file and denied permission; TypeError
        # covers None or another non-path argument; ValueError covers a path
        # with an embedded NUL byte. All of them mean "size unknown", which
        # is reported as "not too large".
        return False
 def upload_audio(audio_path):
     try:
+        size = is_file_larger_than_30mb(audio_path)
+        if size == True:
+            return 'size'
         with open(audio_path, 'rb') as audio_file:
             response = requests.post('http://sls-titan-6.csail.mit.edu:8080/upload/', files={'audio_file': audio_file})
         if response.status_code == 200:
     upload_statues = upload_audio(audio_path)
     if upload_statues == None:
         return 'Please upload an audio file.'
+    if upload_statues == 'size':
+        return 'This demo does not support audio file size larger than 30MB.'
     if question == '':
         return 'Please ask a question.'
     print(audio_path, question)
                         description="LTU-2 an improved version of LTU. LTU-2 is stronger in spoken text understanding and music understanding. <br>" +
                                     "LTU is authored by Yuan Gong, Alexander H. Liu, Hongyin Luo, Leonid Karlinsky, and James Glass (MIT & MIT-IBM Watson AI Lab). <br>" +
                                     "**Please note that the model is under construction and may be buggy. It is trained with some new techniques that are not described in LTU paper. I.e., using method described in LTU paper cannot reproduce this model.**<br>" +
+                                    "Input should be wav file sampled at 16kHz. This demo trim input audio to 10 seconds. <br>"
                                     "**Research Demo, No Commercial Use (Due to license of LLaMA).**")
     demo.launch(debug=False, share=False)