Spaces:

facebook
/

Hokkien_Demo_on_GPU

Build error

lpw committed on Dec 20, 2022

Commit

418e72c

•

1 Parent(s): 796bd4c

Update audio_pipe.py

Files changed (1) hide show

audio_pipe.py CHANGED Viewed

@@ -5,6 +5,7 @@ from typing import List, Tuple
 import numpy as np
 import torch
 # from app.pipelines import Pipeline
 from fairseq import hub_utils
 from fairseq.checkpoint_utils import load_model_ensemble_and_task_from_hf_hub
@@ -105,7 +106,7 @@ class SpeechToSpeechPipeline():
                     [self.tts_model], tts_cfg
                 )
-    def __call__(self, inputs: np.array) -> Tuple[np.array, int, List[str]]:
         """
         Args:
             inputs (:obj:`np.array`):
@@ -120,7 +121,7 @@ class SpeechToSpeechPipeline():
                     This can be the name of the instruments for audio source separation
                     or some annotation for speech enhancement. The length must be `C'`.
         """
-        _inputs = torch.from_numpy(inputs).unsqueeze(0)
         sample, text = None, None
         if self.cfg.task._name in ["speech_to_text", "speech_to_text_sharded"]:
             sample = S2THubInterface.get_model_input(self.task, _inputs)

 import numpy as np
 import torch
+import torchaudio
 # from app.pipelines import Pipeline
 from fairseq import hub_utils
 from fairseq.checkpoint_utils import load_model_ensemble_and_task_from_hf_hub
                     [self.tts_model], tts_cfg
                 )
+    def __call__(self, inputs: str) -> Tuple[np.array, int, List[str]]:
         """
         Args:
             inputs (:obj:`np.array`):
                     This can be the name of the instruments for audio source separation
                     or some annotation for speech enhancement. The length must be `C'`.
         """
+        _inputs = torchaudio.load(inputs)
         sample, text = None, None
         if self.cfg.task._name in ["speech_to_text", "speech_to_text_sharded"]:
             sample = S2THubInterface.get_model_input(self.task, _inputs)