Spaces: Build error
Update audio_foundation_models.py
Browse files
audio_foundation_models.py
CHANGED
@@ -556,7 +556,7 @@ class SoundDetection:
|
|
556 |
self.model.to(device)
|
557 |
|
558 |
@prompts(name="Detect The Sound Event From The Audio",
|
559 |
-
description="useful for when you want to know what event in the audio and the sound event start or end time, "
|
560 |
"receives audio_path as input. "
|
561 |
"The input to this tool should be a string, "
|
562 |
"representing the audio_path. " )
|
@@ -769,7 +769,8 @@ class TargetSoundDetection:
|
|
769 |
"The input to this tool should be a comma seperated string of two, "
|
770 |
"representing audio path and the text description. " )
|
771 |
|
772 |
-
def inference(self,
|
|
|
773 |
target_emb = self.build_clip(text) # torch type
|
774 |
idx = self.cal_similarity(target_emb, self.re_embeds)
|
775 |
target_event = self.id_to_event[idx]
|
|
|
556 |
self.model.to(device)
|
557 |
|
558 |
@prompts(name="Detect The Sound Event From The Audio",
|
559 |
+
description="useful for when you want to know what event in the audio and the sound event start or end time, it will return an image "
|
560 |
"receives audio_path as input. "
|
561 |
"The input to this tool should be a string, "
|
562 |
"representing the audio_path. " )
|
|
|
769 |
"The input to this tool should be a comma seperated string of two, "
|
770 |
"representing audio path and the text description. " )
|
771 |
|
772 |
+
def inference(self, inputs):
|
773 |
+
audio_path, text = inputs.split(",")[0], ','.join(inputs.split(',')[1:])
|
774 |
target_emb = self.build_clip(text) # torch type
|
775 |
idx = self.cal_similarity(target_emb, self.re_embeds)
|
776 |
target_event = self.id_to_event[idx]
|