Commit
·
29ead22
1
Parent(s):
f489d22
Solve tensor dimension mismatch issue
Browse files
app.py
CHANGED
|
@@ -47,8 +47,20 @@ def separate_all_stems(audio_file_path: str, model_name: str):
|
|
| 47 |
|
| 48 |
sr = signal.sample_rate
|
| 49 |
|
| 50 |
-
|
| 51 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 52 |
|
| 53 |
with torch.no_grad():
|
| 54 |
stems_batch = apply_model(
|
|
|
|
| 47 |
|
| 48 |
sr = signal.sample_rate
|
| 49 |
|
| 50 |
+
# Ensure audio_data is a torch.Tensor
|
| 51 |
+
audio = signal.audio_data
|
| 52 |
+
if isinstance(audio, np.ndarray):
|
| 53 |
+
audio = torch.from_numpy(audio)
|
| 54 |
+
|
| 55 |
+
audio = audio.float() # [channels, samples] or [channels, samples, ?]
|
| 56 |
+
|
| 57 |
+
# Remove extra trailing dimensions
|
| 58 |
+
if audio.ndim > 2:
|
| 59 |
+
audio = audio.squeeze()
|
| 60 |
+
|
| 61 |
+
# Final shape: [1, channels, samples]
|
| 62 |
+
waveform = audio.unsqueeze(0)
|
| 63 |
+
|
| 64 |
|
| 65 |
with torch.no_grad():
|
| 66 |
stems_batch = apply_model(
|