@inproceedings{f4c7495f40ad466c92c8b9be5176acfc,
title = "3D Guided Weakly Supervised Semantic Segmentation",
abstract = "Pixel-wise clean annotation is necessary for fully-supervised semantic segmentation, which is laborious and expensive to obtain. In this paper, we propose a weakly supervised 2D semantic segmentation model by incorporating sparse bounding box labels with available 3D information, which is much easier to obtain with advanced sensors. We introduce a 2D-3D inference module to generate accurate pixel-wise segment proposal masks. Guided by 3D information, we first generate a point cloud of objects and calculate a per class objectness probability score for each point using projected bounding-boxes. Then we project the point cloud with objectness probabilities back to the 2D images followed by a refinement step to obtain segment proposals, which are treated as pseudo labels to train a semantic segmentation network. Our method works in a recursive manner to gradually refine the above-mentioned segment proposals. We conducted extensive experimental results on the 2D-3D-S dataset where we manually labeled a subset of images with bounding boxes. We show that the proposed method can generate accurate segment proposals when bounding box labels are available on only a small subset of training images. Performance comparison with recent state-of-the-art methods further illustrates the effectiveness of our method.",
keywords = "3D guidance, Semantic segmentation, Weak supervision",
author = "Weixuan Sun and Jing Zhang and Nick Barnes",
note = "Publisher Copyright: {\textcopyright} 2021, Springer Nature Switzerland AG.; 15th Asian Conference on Computer Vision, ACCV 2020 ; Conference date: 30-11-2020 Through 04-12-2020",
year = "2021",
doi = "10.1007/978-3-030-69525-5_35",
language = "English",
isbn = "9783030695248",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "585--602",
editor = "Hiroshi Ishikawa and Cheng-Lin Liu and Tomas Pajdla and Jianbo Shi",
booktitle = "Computer Vision – ACCV 2020 - 15th Asian Conference on Computer Vision, 2020, Revised Selected Papers",
address = "Germany",
}