Spaces:

Siddhant
/

ESPnet2-SLU

Runtime error

ssiidd committed on Nov 14, 2021

Commit

12c22ef

1 Parent(s): 9568053

Add fairseq installation

Files changed (1) hide show

app.py CHANGED Viewed

@@ -46,13 +46,19 @@ def inference(wav,data):
           action=intent.split("_")[1]
           text="{scenario: "+scenario+", action: "+action+"}"
       elif data == "english_fsc":
           speech, rate = soundfile.read(wav.name)
           nbests = speech2text_fsc(speech)
           text, *_ = nbests[0]
           intent=text.split(" ")[0]
           action=intent.split("_")[0]
           objects=intent.split("_")[1]
-          location=intent.split("_")[1]
           text="{action: "+action+", object: "+objects+", location: "+location+"}"
       # if lang == "chinese":
       #     wav = text2speechch(text)["wav"]

           action=intent.split("_")[1]
           text="{scenario: "+scenario+", action: "+action+"}"
       elif data == "english_fsc":
+          print(wav.name)
           speech, rate = soundfile.read(wav.name)
+          print(speech.shape)
+          if len(speech.shape)==2:
+            speech=speech[:,0]
+            # soundfile.write("store_file.wav", speech, rate, subtype='FLOAT')
+          print(speech.shape)
           nbests = speech2text_fsc(speech)
           text, *_ = nbests[0]
           intent=text.split(" ")[0]
           action=intent.split("_")[0]
           objects=intent.split("_")[1]
+          location=intent.split("_")[2]
           text="{action: "+action+", object: "+objects+", location: "+location+"}"
       # if lang == "chinese":
       #     wav = text2speechch(text)["wav"]