@inproceedings{29dae60873b843d5bfd98828ab7236cf,
title = "Visual Tracking with Attentional Convolutional Siamese Networks",
abstract = "Recently Siamese trackers have drawn great attention due to their considerable accuracy and speed. To further improve the discriminability of Siamese networks for visual tracking, some deeper networks, such as VGG and ResNet, are exploited as backbone. However, high-level semantic information reduces the location discrimination. In this paper, we propose a novel Attentional Convolutional Siamese Networks for visual tracking (ACST), to improve the classical AlexNet by fusing spatial and channel attentions during feature learning. Moreover, a response-based weighted sampling strategy during training is proposed to strengthen the discrimination power to distinguish two objects with the similar attributes. With the efficiency of cross-correlation operator, our tracker can be trained end-to-end while running in real-time at inference phase. We validate our tracker through extensive experiments on OTB2013 and OTB2015, and results show that the proposed tracker obtains great improvements over the other Siamese trackers.",
keywords = "Siamese networks, Visual attentions, Visual tracking",
author = "Ke Tan and Zhenzhong Wei",
note = "Publisher Copyright: {\textcopyright} 2019, Springer Nature Switzerland AG.; 10th International Conference on Image and Graphics, ICIG 2019 ; Conference date: 23-08-2019 Through 25-08-2019",
year = "2019",
doi = "10.1007/978-3-030-34120-6\_30",
language = "英语",
isbn = "9783030341190",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer",
pages = "369--380",
editor = "Yao Zhao and Chunyu Lin and Nick Barnes and Baoquan Chen and R{\"u}diger Westermann and Xiangwei Kong",
booktitle = "Image and Graphics - 10th International Conference, ICIG 2019, Proceedings, Part 1",
address = "德国",
}