app
Browse files- app.py +36 -29
- data/examples/DUT-OMRON_im103.png +0 -0
- data/examples/ECSSD_0010.png +0 -0
- data/examples/ECSSD_0022.png +0 -0
app.py
CHANGED
|
@@ -69,40 +69,47 @@ def predict(img_input):
|
|
| 69 |
return blend_images(img_pil, T.ToPILImage()(preds_up))
|
| 70 |
|
| 71 |
|
| 72 |
-
title = 'FOUND - unsupervised object localization
|
| 73 |
description = 'Gradio Demo for our CVPR23 paper "Unsupervised Object Localization: Observing the Background to Discover Objects"\n \
|
| 74 |
The app is <i>running on CPUs</i>, inference times are therefore longer than those expected on GPU (80 FPS on a V100 GPU).\n \
|
| 75 |
Please see below for more details.'
|
| 76 |
|
| 77 |
-
article = """
|
|
|
|
| 78 |
|
| 79 |
-
|
| 80 |
-
|
| 81 |
-
|
| 82 |
-
|
| 83 |
-
|
| 84 |
-
|
| 85 |
-
|
| 86 |
-
|
| 87 |
-
|
| 88 |
-
|
| 89 |
-
|
| 90 |
-
|
| 91 |
-
|
| 92 |
-
|
| 93 |
-
|
| 94 |
-
|
| 95 |
-
|
| 96 |
-
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
|
| 100 |
-
|
| 101 |
-
|
| 102 |
-
|
| 103 |
-
|
| 104 |
-
|
| 105 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 106 |
|
| 107 |
|
| 108 |
iface = gr.Interface(fn=predict,
|
|
|
|
| 69 |
return blend_images(img_pil, T.ToPILImage()(preds_up))
|
| 70 |
|
| 71 |
|
| 72 |
+
title = 'FOUND - unsupervised object localization'
|
| 73 |
description = 'Gradio Demo for our CVPR23 paper "Unsupervised Object Localization: Observing the Background to Discover Objects"\n \
|
| 74 |
The app is <i>running on CPUs</i>, inference times are therefore longer than those expected on GPU (80 FPS on a V100 GPU).\n \
|
| 75 |
Please see below for more details.'
|
| 76 |
|
| 77 |
+
article = """
|
| 78 |
+
<h1 align="center">Unsupervised Object Localization: Observing the Background to Discover Objects</h1>
|
| 79 |
|
| 80 |
+
## Highlights
|
| 81 |
+
- Single **conv 1 x 1** layer trained to extract information from DINO [1] features.
|
| 82 |
+
- **No supervision**.
|
| 83 |
+
- Trained only for **2 epochs** on the dataset DUTS-TR.
|
| 84 |
+
- Inference runs at **80 FPS** on a V100 GPU.
|
| 85 |
+
- No post-processing applied in results here.
|
| 86 |
+
|
| 87 |
+
<i> Images provided are taken from VOC07 [2], ECSSD [3] and DUT-OMRON [4].</i>
|
| 88 |
+
|
| 89 |
+
## Citation
|
| 90 |
+
```
|
| 91 |
+
@inproceedings{simeoni2023found,
|
| 92 |
+
author = {Siméoni, Oriane and Sekkat, Chloé and Puy, Gilles and Vobecky, Antonin and Zablocki, Éloi and Pérez, Patrick},
|
| 93 |
+
title = {Unsupervised Object Localization: Observing the Background to Discover Objects},
|
| 94 |
+
booktitle = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}},
|
| 95 |
+
year = {2023},
|
| 96 |
+
}
|
| 97 |
+
```
|
| 98 |
+
|
| 99 |
+
### References
|
| 100 |
+
|
| 101 |
+
[1] M. Caron et al. Emerging properties in self-supervised vision transformers, ICCV 2021
|
| 102 |
+
[2] M. Everingham et al. The PASCAL Visual Object Classes Challenge 2007 (VOC2007) Results
|
| 103 |
+
[3] J. Shi et al. Hierarchical image saliency detection on extended CSSD, IEEE TPAMI 2016
|
| 104 |
+
[4] C. Yang et al. Saliency detection via graph-based manifold ranking, CVPR 2013
|
| 105 |
+
|
| 106 |
+
"""
|
| 107 |
+
|
| 108 |
+
examples = ["data/examples/VOC_000030.jpg",
|
| 109 |
+
"data/examples/ECSSD_0010.png",
|
| 110 |
+
"data/examples/ECSSD_0022.png",
|
| 111 |
+
"data/examples/DUT-OMRON_im103.png",
|
| 112 |
+
]
|
| 113 |
|
| 114 |
|
| 115 |
iface = gr.Interface(fn=predict,
|
data/examples/DUT-OMRON_im103.png
ADDED
|
data/examples/ECSSD_0010.png
ADDED
|
data/examples/ECSSD_0022.png
ADDED
|