@inproceedings{01b3197e254a4d519f59c832aee56dcb,
title = "Information Lossless Multi-modal Image Generation for RGB-T Tracking",
abstract = "Visible-Thermal infrared(RGB-T) multimodal target representation is a key issue affecting RGB-T tracking performance. It is difficult to train a RGB-T fusion tracker in an end-to-end way, due to the lack of annotated RGB-T image pairs as training data. To relieve above problems, we propose an information lossless RGB-T image pair generation method. We generate the TIR data from the massive RGB labeling data, and these aligned RGB-T data pair with labels are used for RGB-T fusion target tracking. Different from the traditional image modal conversion model, this paper uses a reversible neural network to realize the conversion of RGB modal to TIR modal images. The advantage of this method is that it can generate information lossless TIR modal data. Specifically, we design reversible modules and reversible operations for the RGB-T modal conversion task by exploiting the properties of reversible network structure. Then, it does not lose information and train on a large amount of aligned RGB-T data. Finally, the trained model is added to the RGB-T fusion tracking framework to generate paired RGB-T images end-to-end. We conduct adequate experiments on the VOT-RGBT2020 [14] and RGBT234 [16] datasets, the experimental results show that our method can obtain better RGB-T fusion features to represent the target. The performance on the VOT-RGBT2020 [14] and RGBT234 [16] datasets is 4.6% and 4.9% better than the baseline in EAO and Precision rate, respectively.",
keywords = "Data generation, Reversible network, RGB-T tracking",
author = "Fan Li and Yufei Zha and Lichao Zhang and Peng Zhang and Lang Chen",
note = "Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Switzerland AG 2022.; 5th Chinese Conference on Pattern Recognition and Computer Vision, PRCV 2022 ; Conference date: 04-11-2022 Through 07-11-2022",
year = "2022",
doi = "10.1007/978-3-031-18916-6_53",
language = "英语",
isbn = "9783031189159",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "671--683",
editor = "Shiqi Yu and Jianguo Zhang and Zhaoxiang Zhang and Tieniu Tan and Yuen, {Pong C.} and Yike Guo and Junwei Han and Jianhuang Lai",
booktitle = "Pattern Recognition and Computer Vision - 5th Chinese Conference, PRCV 2022, Proceedings",
}