app
Browse files
app.py
CHANGED
@@ -69,7 +69,7 @@ def predict(img_input):
|
|
69 |
return blend_images(img_pil, T.ToPILImage()(preds_up))
|
70 |
|
71 |
|
72 |
-
title = 'FOUND - unsupervised object localization'
|
73 |
description = 'Gradio Demo for our CVPR23 paper "Unsupervised Object Localization: Observing the Background to Discover Objects"\n \
|
74 |
The app is <i>running on CPUs</i>, inference times are therefore longer than those expected on GPU (80 FPS on a V100 GPU).\n \
|
75 |
Please see below for more details.'
|
@@ -77,10 +77,30 @@ description = 'Gradio Demo for our CVPR23 paper "Unsupervised Object Localizatio
|
|
77 |
article = """<h1 align="center">Unsupervised Object Localization: Observing the Background to Discover Objects </h1>
|
78 |
|
79 |
## Highlights
|
80 |
-
|
|
|
81 |
- Trained only for 2 epochs on the dataset DUTS-TR.
|
82 |
- Inference runs at 80 FPS on a V100 GPU.
|
83 |
- No post-processing applied in results here.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
84 |
"""
|
85 |
examples = ["data/examples/VOC_000030.jpg"]
|
86 |
|
|
|
69 |
return blend_images(img_pil, T.ToPILImage()(preds_up))
|
70 |
|
71 |
|
72 |
+
title = 'FOUND - unsupervised object localization \n CVPR23'
|
73 |
description = 'Gradio Demo for our CVPR23 paper "Unsupervised Object Localization: Observing the Background to Discover Objects"\n \
|
74 |
The app is <i>running on CPUs</i>, inference times are therefore longer than those expected on GPU (80 FPS on a V100 GPU).\n \
|
75 |
Please see below for more details.'
|
|
|
77 |
article = """<h1 align="center">Unsupervised Object Localization: Observing the Background to Discover Objects </h1>
|
78 |
|
79 |
## Highlights
|
80 |
+
|
81 |
+
- A single **1 x 1 conv** layer is trained to extract information from DINO [1] features.
|
82 |
- Trained only for 2 epochs on the dataset DUTS-TR.
|
83 |
- Inference runs at 80 FPS on a V100 GPU.
|
84 |
- No post-processing applied in results here.
|
85 |
+
|
86 |
+
<i>The images provided are taken from VOC07 [2], ECSSD [3] and DUT-OMRON [4].</i>
|
87 |
+
|
88 |
+
## Citation
|
89 |
+
```
|
90 |
+
@inproceedings{simeoni2023found,
|
91 |
+
author = {Siméoni, Oriane and Sekkat, Chloé and Puy, Gilles and Vobecky, Antonin and Zablocki, Éloi and Pérez, Patrick},
|
92 |
+
title = {Unsupervised Object Localization: Observing the Background to Discover Objects},
|
93 |
+
booktitle = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}},
|
94 |
+
year = {2023},
|
95 |
+
}
|
96 |
+
```
|
97 |
+
|
98 |
+
### References
|
99 |
+
|
100 |
+
[1] M. Caron et al. Emerging properties in self-supervised vision transformers, ICCV 2021
|
101 |
+
[2] M. Everingham et al. The PASCAL Visual Object Classes Challenge 2007 (VOC2007) Results
|
102 |
+
[3] J. Shi et al. Hierarchical image saliency detection on extended CSSD, IEEE TPAMI 2016
|
103 |
+
[4] C. Yang et al. Saliency detection via graph-based manifold ranking, CVPR 2013
|
104 |
"""
|
105 |
examples = ["data/examples/VOC_000030.jpg"]
|
106 |
|