Spaces:
Running
on
Zero
Running
on
Zero
Aboubacar OUATTARA - kaira
committed on
Commit
•
42d17d1
1
Parent(s):
a848bf6
add audio files
Browse files
app.py
CHANGED
@@ -102,10 +102,14 @@ def enhance_speech(audio_array, sampling_rate, solver, nfe, tau, denoise_before_
|
|
102 |
lambd = 0.9 if denoise_before_enhancement else 0.1
|
103 |
|
104 |
denoised_audio, new_sr1 = denoise(audio_array, sampling_rate, device)
|
105 |
-
enhanced_audio, new_sr2 = enhance(audio_array, sampling_rate, device, nfe=nfe, solver=solver, lambd=lambd, tau=tau)
|
106 |
|
107 |
# Convert to numpy and return
|
108 |
-
return (
|
|
|
|
|
|
|
|
|
109 |
|
110 |
|
111 |
def convert_to_int16(audio_array):
|
@@ -138,21 +142,21 @@ def _fn(
|
|
138 |
else:
|
139 |
audio_array, sampling_rate = text_to_speech(bambara_text)
|
140 |
|
141 |
-
#
|
142 |
-
|
143 |
-
|
144 |
-
|
145 |
-
|
146 |
-
|
147 |
-
|
148 |
-
|
149 |
-
|
150 |
|
151 |
# Return all outputs
|
152 |
return (
|
153 |
bambara_text,
|
154 |
(sampling_rate, audio_array.numpy()),
|
155 |
-
|
156 |
# (enhanced_audio[0], convert_to_int16(enhanced_audio[1]))
|
157 |
)
|
158 |
|
|
|
102 |
lambd = 0.9 if denoise_before_enhancement else 0.1
|
103 |
|
104 |
denoised_audio, new_sr1 = denoise(audio_array, sampling_rate, device)
|
105 |
+
# enhanced_audio, new_sr2 = enhance(audio_array, sampling_rate, device, nfe=nfe, solver=solver, lambd=lambd, tau=tau)
|
106 |
|
107 |
# Convert to numpy and return
|
108 |
+
return (
|
109 |
+
(new_sr1, denoised_audio.cpu().numpy()),
|
110 |
+
None
|
111 |
+
# (new_sr2, enhanced_audio.cpu().numpy())
|
112 |
+
)
|
113 |
|
114 |
|
115 |
def convert_to_int16(audio_array):
|
|
|
142 |
else:
|
143 |
audio_array, sampling_rate = text_to_speech(bambara_text)
|
144 |
|
145 |
+
# Step 3: Enhance the audio
|
146 |
+
denoised_audio, _ = enhance_speech(
|
147 |
+
audio_array,
|
148 |
+
sampling_rate,
|
149 |
+
solver,
|
150 |
+
nfe,
|
151 |
+
prior_temp,
|
152 |
+
denoise_before_enhancement
|
153 |
+
)
|
154 |
|
155 |
# Return all outputs
|
156 |
return (
|
157 |
bambara_text,
|
158 |
(sampling_rate, audio_array.numpy()),
|
159 |
+
denoised_audio,
|
160 |
# (enhanced_audio[0], convert_to_int16(enhanced_audio[1]))
|
161 |
)
|
162 |
|