app
Browse files
- app.py +36 -29
- data/examples/DUT-OMRON_im103.png +0 -0
- data/examples/ECSSD_0010.png +0 -0
- data/examples/ECSSD_0022.png +0 -0
app.py
CHANGED
@@ -69,40 +69,47 @@ def predict(img_input):
|
|
69 |
return blend_images(img_pil, T.ToPILImage()(preds_up))
|
70 |
|
71 |
|
72 |
-
title = 'FOUND - unsupervised object localization
|
73 |
description = 'Gradio Demo for our CVPR23 paper "Unsupervised Object Localization: Observing the Background to Discover Objects"\n \
|
74 |
The app is <i>running on CPUs</i>, inference times are therefore longer than those expected on GPU (80 FPS on a V100 GPU).\n \
|
75 |
Please see below for more details.'
|
76 |
|
77 |
-
article = """
|
|
|
78 |
|
79 |
-
|
80 |
-
|
81 |
-
|
82 |
-
|
83 |
-
|
84 |
-
|
85 |
-
|
86 |
-
|
87 |
-
|
88 |
-
|
89 |
-
|
90 |
-
|
91 |
-
|
92 |
-
|
93 |
-
|
94 |
-
|
95 |
-
|
96 |
-
|
97 |
-
|
98 |
-
|
99 |
-
|
100 |
-
|
101 |
-
|
102 |
-
|
103 |
-
|
104 |
-
|
105 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
106 |
|
107 |
|
108 |
iface = gr.Interface(fn=predict,
|
|
|
69 |
return blend_images(img_pil, T.ToPILImage()(preds_up))
|
70 |
|
71 |
|
72 |
+
title = 'FOUND - unsupervised object localization'
|
73 |
description = 'Gradio Demo for our CVPR23 paper "Unsupervised Object Localization: Observing the Background to Discover Objects"\n \
|
74 |
The app is <i>running on CPUs</i>, inference times are therefore longer than those expected on GPU (80 FPS on a V100 GPU).\n \
|
75 |
Please see below for more details.'
|
76 |
|
77 |
+
article = """
|
78 |
+
<h1 align="center">Unsupervised Object Localization: Observing the Background to Discover Objects</h1>
|
79 |
|
80 |
+
## Highlights
|
81 |
+
- Single **conv 1 x 1** layer trained to extract information from DINO [1] features.
|
82 |
+
- **No supervision**.
|
83 |
+
- Trained only for **2 epochs** on the dataset DUTS-TR.
|
84 |
+
- Inference runs at **80 FPS** on a V100 GPU.
|
85 |
+
- No post-processing applied in results here.
|
86 |
+
|
87 |
+
<i> Images provided are taken from VOC07 [2], ECSSD [3] and DUT-OMRON [4].</i>
|
88 |
+
|
89 |
+
## Citation
|
90 |
+
```
|
91 |
+
@inproceedings{simeoni2023found,
|
92 |
+
author = {Siméoni, Oriane and Sekkat, Chloé and Puy, Gilles and Vobecky, Antonin and Zablocki, Éloi and Pérez, Patrick},
|
93 |
+
title = {Unsupervised Object Localization: Observing the Background to Discover Objects},
|
94 |
+
booktitle = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}},
|
95 |
+
year = {2023},
|
96 |
+
}
|
97 |
+
```
|
98 |
+
|
99 |
+
### References
|
100 |
+
|
101 |
+
[1] M. Caron et al. Emerging properties in self-supervised vision transformers, ICCV 2021
|
102 |
+
[2] M. Everingham et al. The PASCAL Visual Object Classes Challenge 2007 (VOC2007) Results
|
103 |
+
[3] J. Shi et al. Hierarchical image saliency detection on extended CSSD, IEEE TPAMI 2016
|
104 |
+
[4] C. Yang et al. Saliency detection via graph-based manifold ranking, CVPR 2013
|
105 |
+
|
106 |
+
"""
|
107 |
+
|
108 |
+
examples = ["data/examples/VOC_000030.jpg",
|
109 |
+
"data/examples/ECSSD_0010.png",
|
110 |
+
"data/examples/ECSSD_0022.png",
|
111 |
+
"data/examples/DUT-OMRON_im103.png",
|
112 |
+
]
|
113 |
|
114 |
|
115 |
iface = gr.Interface(fn=predict,
|
data/examples/DUT-OMRON_im103.png
ADDED
![DUT-OMRON_im103.png](data/examples/DUT-OMRON_im103.png)
data/examples/ECSSD_0010.png
ADDED
![ECSSD_0010.png](data/examples/ECSSD_0010.png)
data/examples/ECSSD_0022.png
ADDED
![ECSSD_0022.png](data/examples/ECSSD_0022.png)