Update utils.py
Browse files
utils.py
CHANGED
|
@@ -1912,13 +1912,7 @@ def extract_speech_token(model, feature_extractor, utts, batch_size=128):
|
|
| 1912 |
# make sure kernel also on device
|
| 1913 |
if hasattr(_resample_buffer[sample_rate], "kernel"):
|
| 1914 |
_resample_buffer[sample_rate].kernel = _resample_buffer[sample_rate].kernel.to(device)
|
| 1915 |
-
|
| 1916 |
-
audio_device = audio.device
|
| 1917 |
-
audio = audio.cpu()
|
| 1918 |
-
audio = _resample_buffer[sample_rate](audio)
|
| 1919 |
-
audio = audio.to(audio_device)
|
| 1920 |
-
else:
|
| 1921 |
-
audio = _resample_buffer[sample_rate](audio)
|
| 1922 |
# if audio.shape[0] > 1:
|
| 1923 |
# audio = audio[:1]
|
| 1924 |
audio = audio[0]
|
|
|
|
| 1912 |
# make sure kernel also on device
|
| 1913 |
if hasattr(_resample_buffer[sample_rate], "kernel"):
|
| 1914 |
_resample_buffer[sample_rate].kernel = _resample_buffer[sample_rate].kernel.to(device)
|
| 1915 |
+
audio = _resample_buffer[sample_rate](audio)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1916 |
# if audio.shape[0] > 1:
|
| 1917 |
# audio = audio[:1]
|
| 1918 |
audio = audio[0]
|