Spaces:
Running
Running
Fix bug
Browse files
- app.py +3 -1
- requirements.txt +1 -1
app.py
CHANGED
@@ -74,10 +74,12 @@ def greet(image, audio):
|
|
74 |
title = "Audio-Grounded Contrastive Learning"
|
75 |
|
76 |
description = """<p>
|
77 |
-
This is a simple demo of Can CLIP Help Sound Source Localization? (WACV2024), zero-shot visual sound localization
|
78 |
To use it simply upload an image and corresponding audio to mask (identify in the image), or use one of the examples below and click ‘submit’.
|
79 |
</p>"""
|
80 |
|
|
|
|
|
81 |
demo = gr.Interface(
|
82 |
fn=greet,
|
83 |
inputs=[gr.Image(type='pil'), gr.Audio()],
|
|
|
74 |
title = "Audio-Grounded Contrastive Learning"
|
75 |
|
76 |
description = """<p>
|
77 |
+
This is a simple demo of Can CLIP Help Sound Source Localization? (WACV2024), zero-shot visual sound localization.<br><br>
|
78 |
To use it simply upload an image and corresponding audio to mask (identify in the image), or use one of the examples below and click ‘submit’.
|
79 |
</p>"""
|
80 |
|
81 |
+
article = "<p style='text-align: center'><a href='https://arxiv.org/abs/2311.04066'>Can CLIP Help Sound Source Localization?</a> | <a href='https://github.com/swimmiing/ACL-SSL'>Offical Github repo</a></p>"
|
82 |
+
|
83 |
demo = gr.Interface(
|
84 |
fn=greet,
|
85 |
inputs=[gr.Image(type='pil'), gr.Audio()],
|
requirements.txt
CHANGED
@@ -3,4 +3,4 @@ torchvision==0.14.0
|
|
3 |
torchaudio==0.13.0
|
4 |
transformers==4.25.1
|
5 |
Pillow
|
6 |
-
opencv-python
|
|
|
3 |
torchaudio==0.13.0
|
4 |
transformers==4.25.1
|
5 |
Pillow
|
6 |
+
opencv-python
|