% Conference paper (WACV 2017) by Zhang, He and Porikli on refining object segment proposals.
% `series` is intentionally omitted: the exported value merely repeated `booktitle`,
% which makes standard styles print the proceedings title twice.
% NOTE(review): `address` holds a country rather than the publisher's city -- confirm and replace if known.
@inproceedings{3fc3e36ca4964a2c9d75eb1288bfe2b2,
title = "Learning spatial transforms for refining object segment proposals",
abstract = "We address the problem of object segment proposal generation, which is a critical step in many instance-level semantic segmentation and scene understanding pipelines. In contrast to prior works that predict binary segment masks from images, we take an alternative refinement approach to improve the quality of a given segment candidate pool. In particular, we propose an efficient deep network that learns 2D spatial transforms to warp an initial object mask towards nearby object region. We formulate this segment refinement task as a regression problem and design a novel feature pooling strategy in our deep network to predict an affine transformation for each object mask. We evaluate our method extensively on two challenging public benchmarks and apply our refinement network to three different initial segment proposal settings. Our results show sizable improvements in average recall across all the settings, achieving the state-of-the-art performances.",
author = "Zhang, Haoyang and He, Xuming and Porikli, Fatih",
note = "Publisher Copyright: {\textcopyright} 2017 IEEE.; 17th IEEE Winter Conference on Applications of Computer Vision, WACV 2017 ; Conference date: 24-03-2017 Through 31-03-2017",
year = "2017",
month = may,
day = "11",
doi = "10.1109/WACV.2017.12",
language = "English",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "37--46",
booktitle = "Proceedings - 2017 {IEEE} Winter Conference on Applications of Computer Vision, {WACV} 2017",
address = "United States",
}