Aditi Tewari committed · Commit b77c785 · 1 Parent(s): b7fe9cf

Update backend and frontend

Files changed:
- soundscripter.html +2 -2
- soundscripter_flaskAPI.py +7 -5
soundscripter.html
CHANGED
@@ -16,7 +16,7 @@
 
 <nav class="navbar" style="background-color:whitesmoke; height:98px; border-radius:30px" >
 <div>
-<img src="wave.png" alt="SoundScripter" width="60" height="70" style="margin-top:-5px">
+<img src="https://huggingface.co/spaces/adititewari/SoundScripter/blob/main/wave.png" alt="SoundScripter" width="60" height="70" style="margin-top:-5px">
 <span class="navbar-brand" style="font-size:35px;"><b>SoundScripter</b></span>
 </div>
 <h5>Automatic Speech Recognition</h5>
@@ -117,7 +117,7 @@
 })
 .then((response) => response.json())
 .then((data) => {
-if (data.
+if (data.text) {
 outputText.value = data.text;
 } else {
 outputText.value = "No text recognized.";
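The new condition matches the {"text": ...} payload the backend returns from /asr (see the JSONResponse in soundscripter_flaskAPI.py below). The same contract can be exercised outside the browser with a short Python client; the URL and file name in this sketch are placeholders, and the multipart field must be called "audio" to match the renamed endpoint parameter.

# Mirrors the page's fetch logic: read "text" from the /asr response, with a fallback.
import requests

API_URL = "http://localhost:7860"  # placeholder; point at wherever the FastAPI app runs

with open("sample.wav", "rb") as f:  # placeholder audio file
    # The multipart field must be named "audio" to match the endpoint's parameter name.
    resp = requests.post(f"{API_URL}/asr", files={"audio": ("sample.wav", f, "audio/wav")})

data = resp.json()
print(data["text"] if data.get("text") else "No text recognized.")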
soundscripter_flaskAPI.py
CHANGED
@@ -30,7 +30,8 @@ async def read_root():
     # Provide the path to the HTML file containing the front-end code
     with open("soundscripter.html", "r") as file:
         html_content = file.read()
-    return HTMLResponse(content=html_content)
+    # return HTMLResponse(content=html_content)
+    return html_content
 
 
 def convert_audio_format(input_data, input_format, output_format='wav'):
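Note that FastAPI's default response class JSON-encodes a bare string, so the browser receives the markup as a JSON string rather than a rendered page; if the intent is to keep returning a plain string, declaring response_class=HTMLResponse on the route keeps the text/html behaviour. A minimal sketch, assuming the usual @app.get("/") decorator (the diff shows only the function body):

# Sketch only: the @app.get("/") decorator and response_class are assumptions;
# the diff shows just the body of read_root().
from fastapi import FastAPI
from fastapi.responses import HTMLResponse

app = FastAPI()

@app.get("/", response_class=HTMLResponse)  # a returned str is sent as text/html
async def read_root():
    # Provide the path to the HTML file containing the front-end code
    with open("soundscripter.html", "r") as file:
        html_content = file.read()
    return html_content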
@@ -52,11 +53,11 @@ def recognize_speech(audio_data, language="hi-IN"):
|
|
52 |
return f"API request failed: {e}"
|
53 |
|
54 |
@app.post("/asr")
|
55 |
-
async def transcribe_audio(
|
56 |
-
contents = await
|
57 |
|
58 |
# Determine the input audio format (assumes the format is part of the file name)
|
59 |
-
input_format =
|
60 |
|
61 |
# Convert audio to WAV format
|
62 |
wav_data = convert_audio_format(contents, input_format)
|
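convert_audio_format is called here but its body sits outside this diff. The sketch below is one plausible bytes-in/bytes-out implementation using pydub, purely an assumption about the helper, matching the call convert_audio_format(contents, input_format):

# Hypothetical implementation of the helper used above; pydub is an assumption
# (it needs ffmpeg on the system for most compressed input formats).
import io
from pydub import AudioSegment

def convert_audio_format(input_data, input_format, output_format='wav'):
    # Decode the uploaded bytes using the extension-derived format ("mp3", "ogg", ...)
    segment = AudioSegment.from_file(io.BytesIO(input_data), format=input_format)
    # Re-encode to the target format and return raw bytes
    buffer = io.BytesIO()
    segment.export(buffer, format=output_format)
    return buffer.getvalue()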
@@ -68,7 +69,8 @@ async def transcribe_audio(file: UploadFile = File(...)):
 
     # Transcribe the audio
     result = recognize_speech(wav_data)
-
+    print(result)
+    # print(JSONResponse(content={"text": result}))
     # return {"Text": result}
     return JSONResponse(content={"text": result})
 
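recognize_speech is likewise not shown in this diff. Going only by the hi-IN default and the "API request failed" message in the hunk above, a sketch built on the SpeechRecognition package's Google Web Speech backend could look like this; it is an assumed implementation, not necessarily what the Space uses:

# Assumed implementation of recognize_speech; the actual Space may call a different ASR service.
import io
import speech_recognition as sr

def recognize_speech(audio_data, language="hi-IN"):
    recognizer = sr.Recognizer()
    # audio_data is expected to be WAV bytes (see convert_audio_format above)
    with sr.AudioFile(io.BytesIO(audio_data)) as source:
        audio = recognizer.record(source)
    try:
        return recognizer.recognize_google(audio, language=language)
    except sr.UnknownValueError:
        return ""
    except sr.RequestError as e:
        return f"API request failed: {e}"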
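Taken together, the endpoints touched by this commit can be smoke-tested in-process with FastAPI's TestClient; sample.wav is a placeholder and the assertions only check the response shape:

# In-process smoke test of the two endpoints changed in this commit.
from fastapi.testclient import TestClient
from soundscripter_flaskAPI import app  # module name as in this repo

client = TestClient(app)

# Root route: the page markup should appear in the response body.
assert "SoundScripter" in client.get("/").text

# /asr: the upload goes under the form field "audio"; the reply carries a "text" key.
with open("sample.wav", "rb") as f:  # placeholder audio file
    resp = client.post("/asr", files={"audio": ("sample.wav", f, "audio/wav")})
assert "text" in resp.json()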