% Conference paper in the ACCV 2018 proceedings (Lecture Notes in Computer Science).
% The citation key is kept unchanged so existing \cite commands keep resolving.
@inproceedings{399d4f907f7a4b8f89fbd4cf9dc4f642,
  author    = {Rahman, Shafin and Khan, Salman and Porikli, Fatih},
  title     = {Zero-Shot Object Detection: Learning to Simultaneously Recognize and Localize Novel Concepts},
  booktitle = {Computer Vision -- {ACCV} 2018 -- 14th Asian Conference on Computer Vision, Revised Selected Papers},
  editor    = {Schindler, Konrad and Li, Hongdong and Mori, Greg and Jawahar, C. V.},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer},
  address   = {Cham},
  year      = {2019},
  pages     = {547--563},
  doi       = {10.1007/978-3-030-20887-5_34},
  isbn      = {978-3-030-20886-8},
  language  = {English},
  keywords  = {Object detection, Zero-shot detection, Zero-shot learning},
  abstract  = {Current Zero-Shot Learning (ZSL) approaches are restricted to recognition of a single dominant unseen object category in a test image. We hypothesize that this setting is ill-suited for real-world applications where unseen objects appear only as a part of a complex scene, warranting both {\textquoteleft}recognition{\textquoteright} and {\textquoteleft}localization{\textquoteright} of an unseen category. To address this limitation, we introduce a new {\textquoteleft}Zero-Shot Detection{\textquoteright} (ZSD) problem setting, which aims at simultaneously recognizing and locating object instances belonging to novel categories without any training examples. We also propose a new experimental protocol for ZSD based on the highly challenging ILSVRC dataset, adhering to practical issues, e.g., the rarity of unseen objects. To the best of our knowledge, this is the first end-to-end deep network for ZSD that jointly models the interplay between visual and semantic domain information. To overcome the noise in the automatically derived semantic descriptions, we utilize the concept of meta-classes to design an original loss function that achieves synergy between max-margin class separation and semantic space clustering. Furthermore, we present a baseline approach extended from recognition to ZSD setting. Our extensive experiments show significant performance boost over the baseline on the imperative yet difficult ZSD problem.},
  note      = {Publisher Copyright: {\textcopyright} 2019, Springer Nature Switzerland AG.; 14th Asian Conference on Computer Vision, ACCV 2018; Conference date: 02-12-2018 Through 06-12-2018},
}