@inproceedings{9b3e98b2890a43e89c8bde75c4812316,
title = "Robust and real-time deep tracking via multi-scale domain adaptation",
abstract = "Visual tracking is a fundamental problem in computer vision. Recently, some deep-learning-based tracking algorithms have been achieving record-breaking performances. However, due to the high complexity of deep learning, most deep trackers suffer from low tracking speed, and thus are impractical in many real-world applications. Some new deep trackers with smaller network structure achieve high efficiency while at the cost of significant decrease on precision. In this paper, we propose to transfer the feature for image classification to the visual tracking domain via convolutional channel reductions. The channel reduction could be simply viewed as an additional convolutional layer with the specific task. It not only extracts useful information for object tracking but also significantly increases the tracking speed. To better accommodate the useful feature of the target in different scales, the adaptation filters are designed with different sizes. The yielded visual tracker is real-time and also illustrates the state-of-the-art accuracies in the experiment involving two well-adopted benchmarks with more than 100 test videos.",
keywords = "Deep learning, Real-time, Visual tracking",
author = "Xinyu Wang and Hanxi Li and Yi Li and Fumin Shen and Fatih Porikli",
note = "Publisher Copyright: {\textcopyright} 2017 IEEE.; 2017 IEEE International Conference on Multimedia and Expo, ICME 2017 ; Conference date: 10-07-2017 Through 14-07-2017",
year = "2017",
month = aug,
day = "28",
doi = "10.1109/ICME.2017.8019450",
language = "English",
series = "Proceedings - IEEE International Conference on Multimedia and Expo",
publisher = "IEEE Computer Society",
pages = "1338--1343",
booktitle = "2017 IEEE International Conference on Multimedia and Expo, ICME 2017",
address = "United States",
}