ClearVoice-SR

Running on Zero

alibabasglab committed on Oct 17, 2024

Commit

3956066

verified ·

1 Parent(s): bdaf47a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,28 +6,29 @@ from clearvoice import ClearVoice
 myClearVoice = ClearVoice(task='speech_enhancement', model_names=['FRCRN_SE_16K'])
 def fn_clearvoice(aud):
-    # Load and add fake batch dimension
-    """
-    noisy = enhance_model.load_audio(
-    aud
-    ).unsqueeze(0)
-    enhanced = enhance_model.enhance_batch(noisy, lengths=torch.tensor([1.]))
-    """
     output_wav_dict = myClearVoice(input_path='input.wav', online_write=False)
     if isinstance(output_wav_dict, dict):
         key = next(iter(output_wav_dict))
         output_wav = output_wav_dict[key]
     else:
         output_wav = output_wav_dict
-    sf.write('enhanced.wav', output_wav, 16000)
     return 'enhanced.wav'
-inputs = gr.Audio(sources=["upload"], label="Input Audio", type="filepath")
-outputs = gr.Audio(label="Output Audio", type="filepath")
-title = "ClearVoice"
-description = "Gradio demo for Speech enhancement with ClearVoice. To use it, simply upload your audio, or click one of the examples to load them. Read more at the links below."
-article = "<p style='text-align: center'><a href='https://arxiv.org/abs/2206.07293' target='_blank'>FRCRN: Boosting Feature Representation Using Frequency Recurrence for Monaural Speech Enhancement</a> | <a href='https://github.com/speechbrain/speechbrain' target='_blank'>Github Repo</a></p>"
-examples = [
-    ['input.wav']
-]
-gr.Interface(fn_clearvoice, inputs, outputs, title=title, description=description, article=article, examples=examples).launch()

 myClearVoice = ClearVoice(task='speech_enhancement', model_names=['FRCRN_SE_16K'])
 def fn_clearvoice(aud):
+    """Enhance one audio file and return the path of the enhanced WAV.
+
+    `aud` is the path of the clip to process; the Gradio input component is
+    declared with type="filepath", so the UI passes a file path here.
+    The result is written to 'enhanced.wav' at 16000 Hz and that path is
+    returned for the output audio component.
+    """
+    # Process the clip that was actually submitted, not a fixed file name.
+    output_wav_dict = myClearVoice(input_path=aud, online_write=False)
     if isinstance(output_wav_dict, dict):
+        # A single model is configured, so the first entry is used
+        # (presumably the dict is keyed per model -- confirm against ClearVoice).
         key = next(iter(output_wav_dict))
         output_wav = output_wav_dict[key]
     else:
         output_wav = output_wav_dict
+    # With online_write=False the model call presumably does not save anything
+    # itself, so the waveform must be written here before the path is returned.
+    sf.write('enhanced.wav', output_wav, 16000)
     return 'enhanced.wav'
+# Gradio UI for the demo: one uploaded clip in, one enhanced clip out,
+# with 'input.wav' offered as a ready-made example.
+se_demo = gr.Interface(
+    fn=fn_clearvoice,
+    inputs=[
+        gr.Audio(sources=["upload"], label="Input Audio", type="filepath"),
+    ],
+    outputs=[
+        gr.Audio(label="Output Audio", type="filepath"),
+    ],
+    title="ClearVoice",
+    description=("Gradio demo for Speech enhancement with ClearVoice. To use it, simply upload your audio, or click one of the examples to load them. Read more at the links below."),
+    article=("<p style='text-align: center'><a href='https://arxiv.org/abs/2206.07293' target='_blank'>FRCRN: Boosting Feature Representation Using Frequency Recurrence for Monaural Speech Enhancement</a> | <a href='https://github.com/speechbrain/speechbrain' target='_blank'>Github Repo</a></p>"),
+    examples=[
+        ['input.wav'],
+    ],
+    cache_examples=True,
+)
+se_demo.launch()