swimmiing committed on
Commit
a063f1d
1 Parent(s): 9f952e8
Files changed (2) hide show
  1. app.py +3 -1
  2. requirements.txt +1 -1
app.py CHANGED
@@ -74,10 +74,12 @@ def greet(image, audio):
74
  title = "Audio-Grounded Contrastive Learning"
75
 
76
  description = """<p>
77
- This is a simple demo of Can CLIP Help Sound Source Localization? (WACV2024), zero-shot visual sound localization<br><br>.
78
  To use it simply upload an image and corresponding audio to mask (identify in the image), or use one of the examples below and click ‘submit’.
79
  </p>"""
80
 
 
 
81
  demo = gr.Interface(
82
  fn=greet,
83
  inputs=[gr.Image(type='pil'), gr.Audio()],
 
74
  title = "Audio-Grounded Contrastive Learning"
75
 
76
  description = """<p>
77
+ This is a simple demo of Can CLIP Help Sound Source Localization? (WACV2024), zero-shot visual sound localization.<br><br>
78
  To use it simply upload an image and corresponding audio to mask (identify in the image), or use one of the examples below and click ‘submit’.
79
  </p>"""
80
 
81
+ article = "<p style='text-align: center'><a href='https://arxiv.org/abs/2311.04066'>Can CLIP Help Sound Source Localization?</a> | <a href='https://github.com/swimmiing/ACL-SSL'>Offical Github repo</a></p>"
82
+
83
  demo = gr.Interface(
84
  fn=greet,
85
  inputs=[gr.Image(type='pil'), gr.Audio()],
requirements.txt CHANGED
@@ -3,4 +3,4 @@ torchvision==0.14.0
3
  torchaudio==0.13.0
4
  transformers==4.25.1
5
  Pillow
6
- opencv-python==4.8.1.78
 
3
  torchaudio==0.13.0
4
  transformers==4.25.1
5
  Pillow
6
+ opencv-python